diff --git a/HTMLparser.c b/HTMLparser.c
index 6ebbded4..132c7d9f 100644
--- a/HTMLparser.c
+++ b/HTMLparser.c
@@ -1,5 +1,14 @@
/*
- * HTMLparser.c : an HTML 4.0 non-verifying parser
+ * HTMLparser.c : an HTML parser
+ *
+ * References:
+ * HTML Living Standard
+ * https://html.spec.whatwg.org/multipage/parsing.html
+ *
+ * Tokenization conforms to the HTML5 specification. Tree construction
+ * still uses a custom, non-standard algorithm. See:
+ *
+ * https://gitlab.gnome.org/GNOME/libxml2/-/issues/211
*
* See Copyright for the status of this software.
*