1
  
2
  
3
  
4
  
5
  
6
  
7
  
8
  
9
  
10
  
11
  
12
  
13
  
14
  
15
  
16
  
17
  
18
  
19
  
20
  
21
  
22
  
23
  
24
  
25
  
26
  
27
  
28
  
29
  
30
  
31
  
32
  
33
  
34
  
35
  
36
  
37
  
38
  
39
  
40
  
41
  
42
  
43
  
44
  
45
  
46
  
47
  
48
  
49
  
50
  
// Run the filter registered for content_type over the document and
// store the resulting words in db.
//
// Every entry of the filter output's "fields" mapping is normalized,
// tokenized and inserted under the document's own uri and the given
// language. Every entry of "uri_anchors" (if present) is normalized,
// tokenized and inserted under the *linked* uri instead, with language
// and field both 0 and a 4-bit hash of the source uri as extra argument.
//
// Returns the "links" member of the filter output.
// Throws a string if Search.get_filter() has no filter for content_type.
array(Standards.URI) index_document(Search.Database.MySQL db,
                                    string|Standards.URI uri,
                                    string|Stdio.File data,
                                    string content_type,
                                    void|string language)
{
  Search.Filter.Base indexer = Search.get_filter(content_type);
  if(!indexer)
  {
    throw("No indexer for content type "+content_type);
  }

  Search.Filter.Base.Output result = indexer->filter(uri, data, content_type);

  // Non-anchor fields: one insert per field name.
  foreach(indices(result->fields), string field_name)
  {
    array(string) field_words =
      Search.Utils.tokenize(Search.Utils.normalize(result->fields[field_name]));
    db->insert_words(uri, language, field_name, field_words);
  }

  // Anchor texts: keep only the low four bits of the source uri's hash.
  int origin_hash = hash((string)uri) & 0xf;
  if(result->uri_anchors)
  {
    foreach(indices(result->uri_anchors), string target_uri)
    {
      array(string) anchor_words =
        Search.Utils.tokenize(Search.Utils.normalize(result->uri_anchors[target_uri]));
      db->insert_words(target_uri, 0, 0, anchor_words, origin_hash);
    }
  }

  return result->links;
}
 
// Run the filter registered for content_type over the document and
// return the "links" member of its output. Nothing is written to db
// here; the parameter is accepted but not used by this function.
//
// Throws a string if Search.get_filter() has no filter for content_type.
array(Standards.URI) extract_links(Search.Database.MySQL db,
                                   string|Standards.URI uri,
                                   string|Stdio.File data,
                                   string content_type)
{
  Search.Filter.Base link_filter = Search.get_filter(content_type);
  if(!link_filter)
  {
    throw("No indexer for content type "+content_type);
  }

  return link_filter->filter(uri, data, content_type)->links;
}
 
// Remove a document from the search database.
//
// Thin wrapper: uri and language are forwarded unchanged to
// db->remove_document().
void remove_document(Search.Database.MySQL db,
                     string|Standards.URI uri,
                     void|string language)
{
  db->remove_document(uri, language);
}