Compute lucene-style scores for our hits.
[beagle.git] / Filters / FilterSpreadsheet.cs
blob07174190222891605e76848b9d09c8600dcfa795
//
// FilterSpreadsheet.cs
//
// Copyright (C) 2004 Novell, Inc.
//

//
// Permission is hereby granted, free of charge, to any person obtaining a
// copy of this software and associated documentation files (the "Software"),
// to deal in the Software without restriction, including without limitation
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
// and/or sell copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
// DEALINGS IN THE SOFTWARE.
27 using System;
28 using System.Diagnostics;
29 using System.IO;
30 using System.Xml;
32 using Beagle.Util;
33 using Beagle.Daemon;
namespace Beagle.Filters {

	// Filter that extracts text from spreadsheet files by running the
	// external "ssindex" program on the file and walking the XML that the
	// program writes to its standard output.
	public class FilterSpreadsheet : Filter {

		// MIME types registered as supported flavors, in registration order.
		static readonly string[] supportedMimeTypes = new string[] {
			"application/x-gnumeric",
			"application/csv",
			"application/tab-separated-values",
			"text/comma-separated-values",
			"text/csv",
			"text/spreadsheet",
			"text/tab-separated-values",
			"text/x-comma-separated-values",
			"application/vnd.ms-excel",
			"application/excel",
			"application/x-msexcel",
			"application/x-excel"
		};

		// XML reader layered over the standard output of ssindex.
		// Created by DoPull, released by DoClose.
		XmlTextReader xmlReader;

		// True once the first two lines of ssindex output have been
		// skipped and xmlReader has been created for the current file.
		bool ignoredFirst2lines = false;

		// Enables snippet mode and registers every supported MIME type.
		public FilterSpreadsheet ()
		{
			SnippetMode = true;

			foreach (string mimeType in supportedMimeTypes)
				AddSupportedFlavor (FilterFlavor.NewFromMimeType (mimeType));
		}

		// Reads the reader to its end, appending the value of every text
		// node to the filter output, each followed by a structural break.
		// All other node types are ignored.
		void WalkContentNodes (XmlReader reader)
		{
			while (reader.Read ()) {
				switch (reader.NodeType) {
				case XmlNodeType.Text:
					AppendText (reader.Value);
					AppendStructuralBreak ();
					break;
				}
			}
		}

		// Resets the per-file state so that the next DoPull skips the
		// leading output lines again and builds a fresh XML reader.
		// The info argument is not used here.
		override protected void DoOpen (FileInfo info)
		{
			ignoredFirst2lines = false;
		}

		// Runs "ssindex -i <file>", feeds the text nodes of its XML output
		// to the filter and then marks the filter as finished.
		// If ssindex cannot be started, a warning is logged and the file is
		// left unindexed. Exceptions raised while walking the XML are
		// logged at debug level and otherwise ignored.
		override protected void DoPull ()
		{
			// create new external process
			Process pc = new Process ();
			pc.StartInfo.FileName = "ssindex";
			// NOTE(review): the file name is only wrapped in double quotes;
			// a name that itself contains a '"' would split the argument.
			// The right escaping depends on how the runtime parses
			// Arguments -- confirm before changing.
			pc.StartInfo.Arguments = String.Format ("-i \"{0}\"", FileInfo.FullName);
			pc.StartInfo.RedirectStandardInput = false;
			pc.StartInfo.RedirectStandardOutput = true;
			pc.StartInfo.UseShellExecute = false;

			try {
				pc.Start ();
			} catch (System.ComponentModel.Win32Exception) {
				Logger.Log.Warn ("Unable to find ssindex in path; {0} file not indexed.",
						 FileInfo.FullName);
				// Nothing was started; release the Process object.
				pc.Close ();
				Finished ();
				return;
			}

			// process ssindex output
			StreamReader pout = null;
			try {
				pout = pc.StandardOutput;

				if (!ignoredFirst2lines) {
					// The first two output lines are discarded before XML
					// parsing starts (presumably a non-XML preamble --
					// TODO confirm against ssindex).
					pout.ReadLine ();
					pout.ReadLine ();
					xmlReader = new XmlTextReader (pout);
					ignoredFirst2lines = true;
				}

				try {
					WalkContentNodes (xmlReader);
				} catch (Exception e) {
					Logger.Log.Debug ("Exception occurred while indexing {0}.", FileInfo.FullName);
					Logger.Log.Debug (e);
				}
			} finally {
				// Always release the pipe and the child process, even when
				// reading the preamble or creating the reader fails.
				if (pout != null)
					pout.Close ();
				pc.WaitForExit ();
				pc.Close ();
			}

			Finished ();
		}

		// Closes the XML reader, if one was created, and clears the
		// per-file state so a closed reader is never reused.
		override protected void DoClose ()
		{
			if (xmlReader != null) {
				xmlReader.Close ();
				xmlReader = null;
			}
			ignoredFirst2lines = false;
		}
	}
}