1 | | |
2 | | |
3 | | |
4 | | |
5 | | |
6 | | |
7 | | |
8 | | |
9 | | |
10 | | |
11 | | |
12 | | |
13 | | |
14 | | |
15 | | |
16 | | |
17 | | |
18 | | |
19 | | |
20 | | |
21 | | |
22 | | |
23 | | |
24 | | |
25 | | |
26 | | |
27 | | |
28 | | |
29 | | |
30 | | |
31 | | |
32 | | |
33 | | |
34 | | |
35 | | |
36 | | |
37 | | |
38 | | |
39 | | |
40 | | |
41 | | |
42 | | |
43 | | |
44 | | |
45 | | |
46 | | |
47 | | |
48 | | |
49 | | |
| | | | | | inherit Search.Filter.HTML; | | constant contenttypes = ({ "application/msword", "application/vnd.ms-word" }); | constant fields = ({ "body", "title", "keywords"}); | | Output filter(Standards.URI uri, string|Stdio.File data, string content_type) | { | Output res=Output(); | | if(objectp(data)) | data=data->read(); | | string fn = tmp_filename(); | object f = Stdio.File(fn, "wct"); | int r = f->write(data); | f->close(); | if(r != sizeof(data)) | error("Failed to write data for %O (returned %O, not %O)\n", | fn, r, sizeof(data)); | | string text; | string bin = combine_path(getcwd(), "modules/search/bin/wvWare"); | string cwd = combine_path(getcwd(), "modules/search/bin"); | string xml = combine_path(getcwd(), "modules/search/pike-modules/" | "Search.pmod/Filter.pmod/wvHtml.xml"); | string doc = combine_path(getcwd(), fn); | mixed err = catch | { | text = my_popen( ({ bin, "-c", "utf-8", "-x", xml, doc }), cwd); | }; | if(!rm(fn)) | werror("Search: Failed to remove temporary file: %s\n", fn); | if(err) | throw(err); | | return ::filter(uri, text, "text/html", ([]), "utf-8"); | } | | string _sprintf() | { | return "Search.Filter.Word"; | } | | |
|