Module: BrowserWebData::EntitySumarizationConfig
- Included in:
- BrowserWebData::EntitySumarization::NIFLineParser, BrowserWebData::EntitySumarization::Predicate, BrowserWebData::EntitySumarization::PredicatesSimilarity, BrowserWebData::EntitySumarization::Statistic
- Defined in:
- lib/config/entity_sumarization_config.rb
Constant Summary
- IDENTICAL_PROPERTY_LIMIT =
0.8
- IMPORTANCE_TO_IDENTIFY_MAX_COUNT =
250
- NO_SENSE_PROPERTIES =
%w( http://xmlns.com/foaf/0.1/primaryTopic http://dbpedia.org/ontology/wikiPageRedirects http://dbpedia.org/ontology/wikiPageDisambiguates http://dbpedia.org/ontology/wikiPageRevisionID http://dbpedia.org/ontology/wikiPageID http://www.w3.org/2002/07/owl#sameAs http://www.w3.org/2000/01/rdf-schema#seeAlso http://www.w3.org/2002/07/owl#differentFrom http://dbpedia.org/ontology/wikiPageExternalLink http://xmlns.com/foaf/0.1/depiction )
- COMMON_PROPERTIES =
%W( http://dbpedia.org/ontology/thumbnail http://xmlns.com/foaf/0.1/name http://www.w3.org/2000/01/rdf-schema#label http://dbpedia.org/property/name http://dbpedia.org/property/commonName http://dbpedia.org/property/title http://www.w3.org/2000/01/rdf-schema#comment http://dbpedia.org/ontology/abstract )
- SCAN_REGEXP =
{ begin_index: /(beginIndex).*"(\d+)"/, end_index: /(endIndex).*"(\d+)"/, scan_resource: /<(http:\/\/dbpedia.org\/resource\/(.*))>/, target_resource_link: /(taIdentRef).*<(.*)>/, anchor: /(anchorOf).*"(.*)"/, section: / .*(nif=.*\d)/, group: /(\w+)_(\d+)_(\d+)/, identical_key: /<(http:\/\/[0-9a-zA-z\/._]*)>/ }