|
a/src/doc/user/usermanual.sgml |
|
b/src/doc/user/usermanual.sgml |
|
... |
|
... |
4186 |
<varlistentry>
|
4186 |
<varlistentry>
|
4187 |
<term>Extractor.textextract(ipath)</term>
|
4187 |
<term>Extractor.textextract(ipath)</term>
|
4188 |
<listitem>Extract the document defined
|
4188 |
<listitem>Extract the document defined
|
4189 |
by <replaceable>ipath</replaceable> and return
|
4189 |
by <replaceable>ipath</replaceable> and return
|
4190 |
a <literal>Doc</literal> object. The doc.text field
|
4190 |
a <literal>Doc</literal> object. The doc.text field
|
4191 |
has the document text as either text/plain or
|
4191 |
has the document text converted to either text/plain or
|
4192 |
text/html according to doc.mimetype. The typical use
|
4192 |
text/html according to doc.mimetype. The typical use
|
4193 |
would be as follows:
|
4193 |
would be as follows:
|
4194 |
<programlisting>
|
4194 |
<programlisting>
|
4195 |
qdoc = query.fetchone()
|
4195 |
qdoc = query.fetchone()
|
4196 |
extractor = recoll.Extractor(qdoc)
|
4196 |
extractor = recoll.Extractor(qdoc)
|
4197 |
text = extractor.textextract(qdoc.ipath)</programlisting>
|
4197 |
doc = extractor.textextract(qdoc.ipath)
|
|
|
4198 |
# use doc.text, e.g. for previewing
|
|
|
4199 |
</programlisting>
|
4198 |
</listitem>
|
4200 |
</listitem>
|
4199 |
</varlistentry>
|
4201 |
</varlistentry>
|
4200 |
<varlistentry>
|
4202 |
<varlistentry>
|
4201 |
<term>Extractor.idoctofile(ipath, targetmtype, outfile='')</term>
|
4203 |
<term>Extractor.idoctofile(ipath, targetmtype, outfile='')</term>
|
4202 |
<listitem>Extracts the document into an output file,
|
4204 |
<listitem>Extracts the document into an output file,
|