IndexerDiagram.cd
上传用户:huiyue
上传日期:2022-04-08
资源大小:1429k
文件大小:9k
源码类别:

搜索引擎

开发平台:

ASP/ASPX

  1. <?xml version="1.0" encoding="utf-8"?>
  2. <ClassDiagram MajorVersion="1" MinorVersion="1">
  3.   <Font Name="Tahoma" Size="8.25" /> <!-- Font element directly under the diagram root: Tahoma, size 8.25. -->
  4.   <Comment CommentText="Parsing code has been extracted from the Spider class and moved into Document classes. &#xD;&#xA;&#xD;&#xA;The Spider class only knows about the DocumentFactory and Document classes. It assumes the subclasses will take care of downloading Uri and parsing it into an array of Words (and other properties) that the spider can add to the Catalog.&#xD;&#xA;&#xD;&#xA;The Catalog doesn't remember the Document, it just keeps File and Word references (see other diagram)"> <!-- Diagram note: design overview of how Spider, DocumentFactory, Document and Catalog relate. -->
  5.     <Position X="3.75" Y="2.104" Height="2.26" Width="2.158" />
  6.   </Comment>
  7.   <Comment CommentText="Filter document refers to a document that will be opened via the IFilter interface (but IFilterDocument would have been a bad class name)"> <!-- Diagram note: explains the FilterDocument class name. -->
  8.     <Position X="7.604" Y="9.604" Height="0.99" Width="1.7" />
  9.   </Comment>
  10.   <Comment CommentText="PDF document subclasses FilterDocument so we can intercept the file and access it with other code (eg iTextSharp)&#xD;&#xA;&#xD;&#xA;Added [v7]"> <!-- Diagram note: explains why PdfDocument subclasses FilterDocument. -->
  11.     <Position X="7.604" Y="10.802" Height="1.198" Width="1.7" />
  12.   </Comment>
  13.   <Comment CommentText="DownloadDocument is any non-text file type that cannot easily be indexed without first saving the file to disk"> <!-- Diagram note: defines what DownloadDocument stands for. -->
  14.     <Position X="8.896" Y="6.01" Height="0.844" Width="1.565" />
  15.   </Comment>
  16.   <Class Name="Searcharoo.Common.Document"> <!-- Diagram shape for Searcharoo.Common.Document; its Methods compartment is collapsed. -->
  17.     <Position X="1.75" Y="0.5" Width="1.5" />
  18.     <TypeIdentifier>
  19.       <FileName>Indexer\Documents\Document.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsDocument.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  20.       <HashCode>CiAgAAQIAAAgAEQAAIACAABAAKAEkUAEDYAQgAARgAA=</HashCode>
  21.     </TypeIdentifier>
  22.     <Compartments>
  23.       <Compartment Name="Methods" Collapsed="true" />
  24.     </Compartments>
  25.   </Class>
  26.   <Class Name="Searcharoo.Common.TextDocument"> <!-- Diagram shape for Searcharoo.Common.TextDocument; the members listed below are hidden from the shape. -->
  27.     <Position X="2.25" Y="7" Width="1.5" />
  28.     <TypeIdentifier>
  29.       <FileName>Indexer\Documents\TextDocument.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsTextDocument.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  30.       <HashCode>AAAgAAAAAAAAAAAAAAAAAAAAAAAEEEAAAIAAgAAAQAA=</HashCode>
  31.     </TypeIdentifier>
  32.     <Members>
  33.       <Field Name="_All" Hidden="true" />
  34.       <Field Name="_WordsOnly" Hidden="true" />
  35.       <Method Name="TextDocument" Hidden="true" />
  36.     </Members>
  37.   </Class>
  38.   <Class Name="Searcharoo.Common.DocumentFactory"> <!-- Diagram shape for Searcharoo.Common.DocumentFactory, shown with all members visible. -->
  39.     <Position X="3.75" Y="0.5" Width="1.5" />
  40.     <TypeIdentifier>
  41.       <FileName>Indexer\Documents\DocumentFactory.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsDocumentFactory.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  42.       <HashCode>AAAAAAAAAAKAACAAAAAAAAAAAAAEAAAAAAAAAAAAAAA=</HashCode>
  43.     </TypeIdentifier>
  44.   </Class>
  45.   <Class Name="Searcharoo.Common.FilterDocument"> <!-- Diagram shape for Searcharoo.Common.FilterDocument; the members listed below are hidden from the shape. -->
  46.     <Position X="6" Y="7.75" Width="1.5" />
  47.     <TypeIdentifier>
  48.       <FileName>Indexer\Documents\FilterDocument.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsFilterDocument.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  49.       <HashCode>AAAgAAAAAAAAAAAAAAAEAAAAAAAEMEAAAIAAgAAAQAA=</HashCode>
  50.     </TypeIdentifier>
  51.     <Members>
  52.       <Field Name="_All" Hidden="true" />
  53.       <Field Name="_WordsOnly" Hidden="true" />
  54.       <Method Name="FilterDocument" Hidden="true" />
  55.     </Members>
  56.   </Class>
  57.   <Class Name="Searcharoo.Common.HtmlDocument"> <!-- Diagram shape for Searcharoo.Common.HtmlDocument; listed members are hidden and the Fields compartment is collapsed. -->
  58.     <Position X="4" Y="7" Width="1.5" />
  59.     <TypeIdentifier>
  60.       <FileName>Indexer\Documents\HtmlDocument.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsHtmlDocument.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  61.       <HashCode>CgAgAAAAAgCwAAAEAAACCAAAgIAEAEAECIAQgAAQwAA=</HashCode>
  62.     </TypeIdentifier>
  63.     <Members>
  64.       <Field Name="_All" Hidden="true" />
  65.       <Field Name="_ContentType" Hidden="true" />
  66.       <Field Name="_Description" Hidden="true" />
  67.       <Field Name="_MimeType" Hidden="true" />
  68.       <Field Name="_RobotFollowOK" Hidden="true" />
  69.       <Field Name="_RobotIndexOK" Hidden="true" />
  70.       <Field Name="_Title" Hidden="true" />
  71.       <Field Name="_Uri" Hidden="true" />
  72.       <Field Name="_WordsOnly" Hidden="true" />
  73.       <Field Name="Encoding" Hidden="true" />
  74.       <Method Name="HtmlDocument" Hidden="true" />
  75.       <Method Name="ToString" Hidden="true" />
  76.     </Members>
  77.     <Compartments>
  78.       <Compartment Name="Fields" Collapsed="true" />
  79.     </Compartments>
  80.   </Class>
  81.   <Class Name="Searcharoo.Common.IgnoreDocument"> <!-- Diagram shape for Searcharoo.Common.IgnoreDocument; the IgnoreDocument method entry is hidden from the shape. -->
  82.     <Position X="0.5" Y="7" Width="1.5" />
  83.     <TypeIdentifier>
  84.       <FileName>Indexer\Documents\IgnoreDocument.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsIgnoreDocument.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  85.       <HashCode>AAAgAAAAAAAAAAAAAAAAAAAAAAAEAAAAAAAAgAAAAAA=</HashCode>
  86.     </TypeIdentifier>
  87.     <Members>
  88.       <Method Name="IgnoreDocument" Hidden="true" />
  89.     </Members>
  90.   </Class>
  91.   <Class Name="Searcharoo.Indexer.ProgressEventArgs"> <!-- Diagram shape for Searcharoo.Indexer.ProgressEventArgs, shown with all members visible. -->
  92.     <Position X="10.75" Y="0.5" Width="1.5" />
  93.     <TypeIdentifier>
  94.       <FileName>Indexer\ProgressEventArgs.cs</FileName> <!-- NOTE(review): listing showed "IndexerProgressEventArgs.cs"; directory separator presumably stripped and restored here. Confirm against the project tree. -->
  95.       <HashCode>AAAAAQAAAAAgAAAEAAAAAAAAABAAAAAFAAAAIAAAAAA=</HashCode>
  96.     </TypeIdentifier>
  97.   </Class>
  98.   <Class Name="Searcharoo.Indexer.RobotsTxt"> <!-- Diagram shape for Searcharoo.Indexer.RobotsTxt, including its nested RobotInstruction type shown collapsed. -->
  99.     <Position X="8.75" Y="2.5" Width="1.5" />
  100.     <TypeIdentifier>
  101.       <FileName>Indexer\RobotsTxt.cs</FileName> <!-- NOTE(review): listing showed "IndexerRobotsTxt.cs"; directory separator presumably stripped and restored here. Confirm against the project tree. -->
  102.       <HashCode>QAAAAgAAAAAAAAAAIABAAAAAAAAAAAAAACAAAAAAAgA=</HashCode>
  103.     </TypeIdentifier>
  104.     <NestedTypes>
  105.       <Class Name="Searcharoo.Indexer.RobotsTxt.RobotInstruction" Collapsed="true">
  106.         <TypeIdentifier>
  107.           <NewMemberFileName>Indexer\RobotsTxt.cs</NewMemberFileName> <!-- NOTE(review): same separator restoration as the FileName of the enclosing class; confirm. -->
  108.         </TypeIdentifier>
  109.       </Class>
  110.     </NestedTypes>
  111.   </Class>
  112.   <Class Name="Searcharoo.Indexer.Spider"> <!-- Diagram shape for Searcharoo.Indexer.Spider; _Catalog and _Robot are drawn as association lines, six other fields are hidden. -->
  113.     <Position X="6.75" Y="1.25" Width="1.5" />
  114.     <TypeIdentifier>
  115.       <FileName>Indexer\Spider.cs</FileName> <!-- NOTE(review): listing showed "IndexerSpider.cs"; directory separator presumably stripped and restored here. Confirm against the project tree. -->
  116.       <HashCode>AeABQAIQgAAAAAQAQCCAAAAAAAAAgAAEBAEAQgAAAAA=</HashCode>
  117.     </TypeIdentifier>
  118.     <ShowAsAssociation>
  119.       <Field Name="_Catalog" />
  120.       <Field Name="_Robot" />
  121.     </ShowAsAssociation>
  122.     <Members>
  123.       <Field Name="_CookieContainer" Hidden="true" />
  124.       <Field Name="_GoChecker" Hidden="true" />
  125.       <Field Name="_Stemmer" Hidden="true" />
  126.       <Field Name="_Stopper" Hidden="true" />
  127.       <Field Name="_Visited" Hidden="true" />
  128.       <Field Name="_VisitedHashtable" Hidden="true" />
  129.     </Members>
  130.     <AssociationLine Name="_Catalog" Type="Searcharoo.Common.Catalog" FixedFromPoint="true" FixedToPoint="true"> <!-- Association from the _Catalog field to the Catalog shape, routed through the fixed points below. -->
  131.       <Path>
  132.         <Point X="8.25" Y="1.335" />
  133.         <Point X="9.562" Y="1.335" />
  134.         <Point X="9.562" Y="1.009" />
  135.       </Path>
  136.       <MemberNameLabel ManuallyPlaced="true">
  137.         <Position X="0.05" Y="0.391" />
  138.       </MemberNameLabel>
  139.     </AssociationLine>
  140.     <AssociationLine Name="_Robot" Type="Searcharoo.Indexer.RobotsTxt" FixedFromPoint="true" FixedToPoint="true"> <!-- Association from the _Robot field to the RobotsTxt shape, routed through the fixed points below. -->
  141.       <Path>
  142.         <Point X="8.25" Y="2.25" />
  143.         <Point X="9.5" Y="2.25" />
  144.         <Point X="9.5" Y="2.5" />
  145.       </Path>
  146.     </AssociationLine>
  147.   </Class>
  148.   <Class Name="Searcharoo.Common.Catalog" Collapsed="true"> <!-- Diagram shape for Searcharoo.Common.Catalog, shown collapsed. -->
  149.     <Position X="8.75" Y="0.5" Width="1.5" />
  150.     <TypeIdentifier>
  151.       <FileName>Common\Catalog.cs</FileName> <!-- NOTE(review): listing showed "CommonCatalog.cs"; directory separator presumably stripped and restored here. Confirm against the project tree. -->
  152.       <HashCode>AAIggIAAAAEAAQAEAAAAAABAAIAABEAAAAQAAgAgAog=</HashCode>
  153.     </TypeIdentifier>
  154.   </Class>
  155.   <Class Name="Searcharoo.Common.DocxDocument"> <!-- Diagram shape for Searcharoo.Common.DocxDocument; the members listed below are hidden from the shape. -->
  156.     <Position X="8" Y="7.75" Width="1.5" />
  157.     <TypeIdentifier>
  158.       <FileName>Indexer\Documents\DocxDocument.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsDocxDocument.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  159.       <HashCode>AAAgAAAAAAAAAAAAAAAAAAAAAAAEAAAAAAAAgAAAQAA=</HashCode>
  160.     </TypeIdentifier>
  161.     <Members>
  162.       <Field Name="_WordsOnly" Hidden="true" />
  163.       <Method Name="DocxDocument" Hidden="true" />
  164.     </Members>
  165.   </Class>
  166.   <Class Name="Searcharoo.Common.DownloadDocument"> <!-- Diagram shape for Searcharoo.Common.DownloadDocument, with a manually routed inheritance line to Searcharoo.Common.Document. -->
  167.     <Position X="6.75" Y="6" Width="2" />
  168.     <TypeIdentifier>
  169.       <FileName>Indexer\Documents\DownloadDocument.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsDownloadDocument.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  170.       <HashCode>AAAAAAAAQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA=</HashCode>
  171.     </TypeIdentifier>
  172.     <InheritanceLine Type="Searcharoo.Common.Document" FixedFromPoint="true" FixedToPoint="true"> <!-- Both end points are fixed; the path runs through the three points below. -->
  173.       <Path>
  174.         <Point X="2.5" Y="6.189" />
  175.         <Point X="2.5" Y="6.625" />
  176.         <Point X="6.75" Y="6.625" />
  177.       </Path>
  178.     </InheritanceLine>
  179.   </Class>
  180.   <Class Name="Searcharoo.Common.PdfDocument"> <!-- Diagram shape for Searcharoo.Common.PdfDocument, shown with all members visible. -->
  181.     <Position X="6" Y="10.75" Width="1.5" />
  182.     <TypeIdentifier>
  183.       <FileName>Indexer\Documents\PdfDocument.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsPdfDocument.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  184.       <HashCode>AAAAAAAAAAAAAAAAAAAAAAAAAAAEAAAAAAAAAAAAAAA=</HashCode>
  185.     </TypeIdentifier>
  186.   </Class>
  187.   <Class Name="Searcharoo.Common.PptxDocument"> <!-- Diagram shape for Searcharoo.Common.PptxDocument; the PptxDocument method entry is hidden from the shape. -->
  188.     <Position X="9.75" Y="7.75" Width="1.5" />
  189.     <TypeIdentifier>
  190.       <FileName>Indexer\Documents\PptxDocument.cs</FileName> <!-- NOTE(review): listing showed "IndexerDocumentsPptxDocument.cs"; directory separators presumably stripped and restored here. Confirm against the project tree. -->
  191.       <HashCode>AAAgAAAAAAAAAAAAAAAAAAAAAAAEAAAAAAAAgAAAQAA=</HashCode>
  192.     </TypeIdentifier>
  193.     <Members>
  194.       <Method Name="PptxDocument" Hidden="true" />
  195.     </Members>
  196.   </Class>
  197.   <Enum Name="Searcharoo.Indexer.Level"> <!-- Diagram shape for the Searcharoo.Indexer.Level enum. -->
  198.     <Position X="10.75" Y="4.75" Width="1.5" />
  199.     <TypeIdentifier>
  200.       <FileName>Indexer\ProgressEventArgs.cs</FileName> <!-- NOTE(review): listing showed "IndexerProgressEventArgs.cs"; directory separator presumably stripped and restored here. Confirm against the project tree. -->
  201.       <HashCode>AAAAAABAAIAAAAAAAAABAAAABAAAAAAEAAAAAAEAAAA=</HashCode>
  202.     </TypeIdentifier>
  203.   </Enum>
  204.   <Delegate Name="Searcharoo.Indexer.SpiderProgressEventHandler"> <!-- Diagram shape for the Searcharoo.Indexer.SpiderProgressEventHandler delegate. -->
  205.     <Position X="10.75" Y="3.5" Width="1.5" />
  206.     <TypeIdentifier>
  207.       <FileName>Indexer\ProgressEventArgs.cs</FileName> <!-- NOTE(review): listing showed "IndexerProgressEventArgs.cs"; directory separator presumably stripped and restored here. Confirm against the project tree. -->
  208.       <HashCode>AAAAAAAAAAAAAAQAAAAAAAAQAAAAAAAAAAAAAAAAAAA=</HashCode>
  209.     </TypeIdentifier>
  210.   </Delegate>
  211. </ClassDiagram>