Download this file

html.sh    37 lines (27 with data), 1.0 kB

 1
 2
 3
 4
 5
 6
 7
 8
 9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
#!/bin/sh
# HTML regression test.
#
# Runs a fixed series of recollq queries, captures their output, and compares
# it against the reference file "${myname}.txt" located in the current
# directory.
#
# Relies on names that are not defined in this file -- presumably provided by
# shared.sh and set up by initvariables (TODO confirm against shared.sh):
#   initvariables, checkresult, recollq   commands / functions
#   myname, mystdout, mystderr, mydiffs   variables naming the test and its
#                                         output files

# Locate the parent of the directory holding this script. Expansions are
# quoted so that a checkout path containing spaces does not break the test.
topdir=$(dirname "$0")/..
. "$topdir/shared.sh"
initvariables "$0"

# All queries run in one subshell so that their combined stderr can be
# redirected to a single file and their combined stdout filtered by one
# pipeline.
(
  recollq QMapConstIterator
  recollq Qtextedit Widget Provides Powerful Single-Page
  recollq '"This is the Mysql reference manual"'

  # Tests that the charset spec is correctly recognised inside badhtml.html
  recollq -a 'etonne badhtml'

  # Tests field extraction/storage and indexing.
  # Only the result-count line, the text/html line and the testfield value
  # are kept from the output. "grep -E" is used rather than "egrep": recent
  # GNU grep prints an obsolescence warning for egrep on stderr, which would
  # end up in $mystderr.
  recollq -m -q "testfield:testfieldvalue" \
    | grep -E 'results|^text/html|^testfield ='

  # more unaccenting tests
  recollq -q 'effaranteUTF8HTML'
  recollq -q 'effrayanteUTF8HTML'
  recollq -q 'accentueesUTF8HTML'
  recollq -q 'accentueesISOHTML'
  recollq -q html5charsetaccentue

  # Stripping trade mark and copyright signs
  recollq -q filename:signs.html Registered Trademark Copyright SoundCopyright

  # Text in malformed html (before or after body) should be indexed anyway...
  recollq -q BADHTMLTEXTBEFOREBODY
  recollq -q BADHTMLTEXTINSECONDBODY
  recollq -q BADHTMLTEXTAFTERBODY
) 2> "$mystderr" | grep -E -v '^Recoll query: ' > "$mystdout"
# Lines starting with "Recoll query: " are dropped above before the comparison.

# Compare with the reference output, ignoring whitespace differences (-w);
# both diff's stdout and stderr are stored in $mydiffs.
diff -w "${myname}.txt" "$mystdout" > "$mydiffs" 2>&1
checkresult