Improved HTML indexing; make the queries also look up the HTML-based indexes.

* doc/index.py: improved HTML indexing
* doc/search.php: make the queries also look up the HTML-based indexes

Daniel

commit: 9b00613d0583e2bca7589257bc32984d5b358a10 [log] [tgz]
author: Daniel Veillard <veillard@src.gnome.org> Mon Oct 07 11:13:27 2002 +0000
committer: Daniel Veillard <veillard@src.gnome.org> Mon Oct 07 11:13:27 2002 +0000
tree: 2d0b6b388776e66867ead72e0cf6c1dd28af2f4b
parent: 141d04ba749f93490561b8253794b99490b801eb [diff] [blame]
diff --git a/doc/index.py b/doc/index.py
index 2cca7c0..e3b8588 100755
--- a/doc/index.py
+++ b/doc/index.py

@@ -717,6 +717,15 @@
 
 import glob
 
+def analyzeHTMLText(doc, resource, p, section, id):
+    words = 0
+    try:
+	content = p.content
+	words = words + addStringHTML(content, resource, id, section, 5)
+    except:
+        return -1
+    return words
+
 def analyzeHTMLPara(doc, resource, p, section, id):
     words = 0
     try:
@@ -735,6 +744,15 @@
         return -1
     return words
 
+def analyzeHTML(doc, resource, p, section, id):
+    words = 0
+    try:
+	content = p.content
+	words = words + addStringHTML(content, resource, id, section, 5)
+    except:
+        return -1
+    return words
+
 def analyzeHTML(doc, resource):
     para = 0;
     ctxt = doc.xpathNewContext()
@@ -745,7 +763,7 @@
         title = "Page %s" % (resource)
     addPage(resource, title)
     try:
-	items = ctxt.xpathEval("//h1 | //h2 | //h3 | //p | //pre")
+	items = ctxt.xpathEval("//h1 | //h2 | //h3 | //text()")
 	section = title
 	id = ""
 	for item in items:
@@ -755,7 +773,10 @@
 		    id = item.prop("id")
 		elif item.prop("name"):
 		    id = item.prop("name")
-	    elif item.name == 'p':
+	    elif item.type == 'text':
+	        analyzeHTMLText(doc, resource, item, section, id)
+		para = para + 1
+	    elif item.name == 'text':
 	        analyzeHTMLPara(doc, resource, item, section, id)
 		para = para + 1
 	    elif item.name == 'pre':
commit	9b00613d0583e2bca7589257bc32984d5b358a10	[log] [tgz]
author	Daniel Veillard <veillard@src.gnome.org>	Mon Oct 07 11:13:27 2002 +0000
committer	Daniel Veillard <veillard@src.gnome.org>	Mon Oct 07 11:13:27 2002 +0000
tree	2d0b6b388776e66867ead72e0cf6c1dd28af2f4b
parent	141d04ba749f93490561b8253794b99490b801eb [diff] [blame]