First of all, a huge thanks to Alex Savy for translating this! I highly recommend you follow Alex as he’s at the top of his game in the affiliate space.
<aside> 🚨 For next-level SEO tips, subscribe to SEO Notebook for free!
</aside>
This leak has revealed 1,922 ranking factors of Yandex used in its search algorithm, at least as of July 2022.
This note contains the first 1000 factors. The most interesting ones are highlighted in red. The remaining factors will be added at a later date.
Original file - https://webmarketingschool.com/wp-content/uploads/2023/01/factors_gen.txt
Now, the factors:
Factor {
Index: 0
CppName: "FI_PAGE_RANK"
Name: "PR"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/PageRank>"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_L2, TG_UNUSED]
Description: "Page rank. The factor is remapped."
Authors: "aavdonkin"
Responsibles: "aavdonkin"
}
Factor {
Index: 1
CppName: "FI_TEXT_RELEV"
Name: "TR"
AntiSeoUpperBound: 0.95
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Text relevance (maxfreq - is the frequency of the most frequent word based on the length of the document)."
Authors: ["gulin", "iseg", "leo", "maslov"]
Responsibles: ["gulin", "leo", "maslov"]
}
Factor {
Index: 2
CppName: "FI_LINK_RELEV"
Name: "LR"
AntiSeoUpperBound: 1.0
Group: "Dynamic"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Link relevance. The factor is remapped."
Authors: ["aavdonkin", "gulin", "leshch", "melkov"]
Responsibles: ["aavdonkin", "gulin", "melkov"]
}
Factor {
Index: 3
CppName: "FI_PAGE_RANK_BONUS"
Name: "PrBonus"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/PageRankBonus>"
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: "Priority bonus, priority 7 - text priority. The factor is binary, with a value of 0 for all single-word queries, and a value of 1 for almost all two or more word queries, except for a very small number of results for which there is no link that passed the quota, and the text also failed to pass the quota."
Authors: ["gulin", "leo"]
Responsibles: "pavelgur"
}
Factor {
Index: 4
CppName: "FI_TEXT_RELEV_ALL_WORDS"
Name: "TRp1"
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: "Priority 'Strict' for TR - text priority - all query words are somewhere in the document (subject to the context constraints of the query, such as both words must be in the same sentence)."
Authors: ["denplusplus", "gulin", "leo"]
Responsibles: ["alsafr", "gulin", "leo"]
}
Factor {
Index: 5
CppName: "FI_TEXT_RELEV_PHRASE"
Name: "TRp2"
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: "Priority 'Phrase' for TR - text priority - all query words mentioned in a row in the document."
Authors: ["denplusplus", "gulin", "leo"]
Responsibles: ["alsafr", "gulin", "leo"]
}
Factor {
Index: 6
CppName: "FI_LINK_RELEV_ALL_WORDS"
Name: "LRp1"
Group: "Dynamic"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "(Strict) all query words are in one link."
Authors: ["gulin", "leo"]
Responsibles: ["gulin", "leo"]
}
Factor {
Index: 7
CppName: "FI_LINK_RELEV_PHRASE"
Name: "LRp2"
Group: "Dynamic"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "(phrase) all the query words mentioned in a row in one link."
Authors: ["gulin", "leo"]
Responsibles: ["gulin", "leo"]
}
Factor {
Index: 8
CppName: "FI_TEXT_RELEV_TITLE"
Name: "TRtitle"
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: "The presence of an exact phrase (the query text) in the header (more precisely, in the first sentence of the document). Contextual constraints and stop words are considered with the same accuracy as in TRp2, i.e. factor[8] is bounded above by factor[5] (factor[8] <= factor[5])."
Authors: ["denplusplus", "gulin", "leo"]
Responsibles: ["alsafr", "gulin", "leo"]
}
Factor {
Index: 9
CppName: "FI_TEXT_RELEV_WHOLE_HR_MATCHED"
Name: "TRhr"
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: "A text that has passed the quota was found, in which all words are marked as having BEST_RELEV relevance (title or meta keywords)."
Authors: ["gulin", "leo"]
Responsibles: ["gulin", "leo"]
}
# TODO(FACTORDEL-65): replace with TG_REMOVED
Factor {
Index: 10
CppName: "FI_REMOVED_10"
Name: "Removed_10"
Tags: [TG_UNUSED]
}
Factor {
Index: 11
CppName: "FI_NEWS"
Name: "News"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-3>"
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "This is a news website (determined by patterns in the URL (<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-3>))."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 12
CppName: "FI_SHOP"
Name: "Shop"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-4>"
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "This is a shop (determined by patterns in the URL (<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-4>)). Deprecated."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 13
CppName: "FI_CATALOG"
Name: "Cat"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-2>"
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "This is a catalog (determined by patterns in the URL (<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-2>) or the Yandex catalog)."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 14
CppName: "FI_YA_BAR"
Name: "YaBar"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YaBar>"
Tags: [TG_BROWSER, TG_HOST, TG_STATIC, TG_USER, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_USERFEAT]
Description: "Traffic from Yandex Bar. The factor is remapped."
Authors: ["kostyagin", "somov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 15
CppName: "FI_LONG"
Name: "Long"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "A long document (the longer the document, the greater the value of the factor)."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 16
CppName: "FI_HIT_WEIGHT"
Name: "TRhitw"
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: "Hitweight is a variant of textual relevance in which the weights of all hits are considered equal (i.e., they do not take into account the premiums for title and word proximity). At the same time, the corresponding hits must pass the restrictions of the syntactic Sorcerer (algorithm name), i.e. we can assume that the TRhitw factor is equal to 0 if and only if SoftAndOk is equal to 0."
Authors: ["gulin", "leo"]
Responsibles: ["gulin", "leo"]
}
Factor {
Index: 17
CppName: "FI_LONG_QUERY"
Name: "LongQuery"
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: "The sum of the idf of words in the query. The name does not reflect the essence: for example, for the query 'Gadyach' this factor will be greater than for the query 'Moscow Peter Ekaterinburg Samara'."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 18
CppName: "FI_PURE_TEXT"
Name: "PureText"
Tags: [TG_BINARY, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/LongText>"
Description: "A long text without links."
Authors: "leo"
Responsibles: ["tsimkha", "leo"]
}
Factor {
Index: 19
CppName: "FI_ROOT"
Name: "Root"
AntiSeoUpperBound: 1.0
Tags: [TG_BINARY, TG_DOC, TG_STATIC, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Root>"
Description: "It's a homepage."
Authors: "gulin"
Responsibles: ["gulin", "tsimkha"]
}
# TODO(FACTORDEL-97): replace with TG_REMOVED, TG_REUSABLE and remove old formulas
Factor {
Index: 20
CppName: "FI_REMOVED_20"
Name: "Removed20"
Tags: [TG_UNUSED]
}
# TODO(FACTORDEL-97): replace with TG_REMOVED, TG_REUSABLE and remove old formulas
Factor {
Index: 21
CppName: "FI_REMOVED_21"
Name: "Removed21"
Tags: [TG_UNUSED]
}
Factor {
Index: 22
CppName: "FI_GEO"
Name: "Geo"
Tags: [TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_HOST, TG_BINARY, TG_DEPRECATED, TG_UNDOCUMENTED, TG_OFTEN_ZERO]
Description: "There is a match between the user's region and the site at the country level. Binary factor: 1-matches, 0-no. Based on the ((<http://wiki.yandex-team.ru/ЯндексПоиск/КлассификацияСайтовИСтраниц/Географическая/ИспользованиеВПоиске> geo-classification of sites))."
Authors: ["ark-kum", "gulin", "maslov"]
Responsibles: ["ark-kum", "gulin", "maslov"]
}
Factor {
Index: 23
CppName: "FI_SUBQUERY_THEME_MATCH"
Name: "SubqueryThMatch"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The topics of the query and the document match. The topic of the query is the output of the ((<http://wiki.yandex-team.ru/EvgenijjKroxalev/subquery> SubquerySearch sorcerer rules)). The topic of the document is taken from the Yandex catalog."
Authors: ["abokov", "ekrokhalev", "gulin"]
Responsibles: ["gulin", "lamo"]
}
Factor {
Index: 24
CppName: "FI_SR"
Name: "SR"
Tags: [TG_DOC, TG_STATIC, TG_TRANS, TG_UNDOCUMENTED, TG_UNUSED]
Description: "Complex static rank, calculated based on static components using a separate formula ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/#oftnd1> *))."
Authors: ["gulin", "somov"]
Responsibles: ["gulin", "somov"]
}
Factor {
Index: 25
CppName: "FI_REFINES"
Name: "TRref"
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The factor about the 'refines' number. The query language has a feature 'user refines' ('a word preceded by a percent sign'). By design, this means something like 'it would be nice if there was a word in the document'. The only known ((<http://staff.yandex-team.ru/gulin> Andrey Gulin)) valuable use of this feature is the query [%official %website CompanyName]. This feature is unknown to users, because it's not described in any documentation. It is planned that it will disappear from the query language, but the words with USER_REFINE priority will remain in the sorcerer (algorithm name). The factor indicates how many USER_REFINE words maximum were simultaneously encountered within a single hit in the quorum. It is believed that there are from 0 to 3 words (if > 3, then it is considered as 3). This number is mapped into the interval [0,1)"
Authors: ["gulin", "leo"]
Responsibles: ["gulin", "leo"]
}
Factor {
Index: 26
CppName: "FI_TR_BOOST"
Name: "TRboost"
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The number by which some link factors are multiplied (namely, factors number 6, 7, 47, 66), if the text relevance is 0, and there are just a few links"
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 27
CppName: "FI_TRLR_LEMMA"
Name: "TRLRlemma"
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Lemma coincides in textual relevance."
Authors: ["gulin", "leo"]
Responsibles: ["gulin", "leo"]
}
Factor {
Index: 28
CppName: "FI_TRAFGRAPH_OUT_ALL_SHARE_D"
Name: "TrafgraphOutAll_share_d"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: "Remapped mascot feature TrafgraphOutAll_share_d"
Ticket: "SEARCHSPAM-15531"
Authors: ["bikulov"]
Responsibles: ["bikulov", "sdormidontov"]
ImplementationTime: "2020-09-30"
}
Factor {
Index: 29
CppName: "FI_RELEV_SENTS_DSSM"
Name: "RelevSentsDssm"
Tags: [TG_DYNAMIC, TG_DOC, TG_DOC_TEXT, TG_NEURAL, TG_NN_OVER_FEATURES_USE]
Description: "Dssm model, trained to reformulate, uses sentences relevant to the query in the document part"
UseArtifact: {Name: "DssmRelevSents"}
Ticket: "FACTOR-2259"
Authors: ["padese"]
Responsibles: ["padese"]
ImplementationTime: "2020-03-03"
}
Factor {
Index: 30
CppName: "FI_FRESH_NEWS_DETECTOR_PREDICT"
Name: "FreshNewsDetectorPredict"
Ticket: "WEBFRESH-478"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_FRESHNESS_USE, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_UNUSED, TG_NOT_01]
Description: "The value of the news detector calculated in the Hippopotamus (name of the algorithm). Always 0 when the detector value is lower than the limit."
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
MinValue: -3e+38
MaxValue: 3e+38
ImplementationTime: "2020-09-27"
}
Factor {
Index: 31
CppName: "FI_HIT_NUM_100"
Name: "LRHitNum100"
Group: "LegacyLR"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The converted number of words in the query in all url links."
Authors: "leshch"
Responsibles: "alsafr"
}
Factor {
Index: 32
CppName: "FI_HIT_NUM_GT_16"
Name: "LRHitNumGt16"
Group: "LegacyLR"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The document LR>20 if it has the number of query words in links> 16, the pro LR factor."
Authors: "leshch"
Responsibles: "alsafr"
}
Factor {
Index: 33
CppName: "FI_PCT_LINKS"
Name: "PctLinks"
Group: "LegacyLR"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "For documents with high LR - normalized link relevance without proximity, for documents with low LR 0"
Authors: "leshch"
Responsibles: "alsafr"
}
Factor {
Index: 34
CppName: "FI_HAS_LR"
Name: "HasLR"
Group: "LegacyLR"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "Url has a high LR."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 35
CppName: "FI_LINK_QUALITY"
Name: "LinkQuality"
Tags: [TG_DOC, TG_LINK_TEXT, TG_STATIC, TG_DEPRECATED, TG_L2]
Description: "Quality of incoming links (Leschiner classifier) - broken, see [405]"
Authors: "leshch"
Responsibles: "alsafr"
}
Factor {
Index: 36
CppName: "FI_ALICE_MUSIC_TRACK_TITLE_COSINE_MATCH_MAX_PREDICTION"
Name: "AliceMusicTrackTitleCosineMatchMaxPrediction"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The value of CosineMatchMaxPrediction for the stream AliceMusic"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 37
CppName: "FI_NUM_LINKS"
Name: "NumLinks"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NumLinks>"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_L2, TG_UNUSED]
Description: "The number of incoming links. Remapping."
Responsibles: ["tsimkha", "alsafr"]
}
Factor {
Index: 38
CppName: "FI_POPULAR_Q"
Name: "PopularQ"
DependsOn: [{Feature: ["PopularQ"], Slice: "begemot_query_factors"}]
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_L2, TG_DEPRECATED]
Group: "Query"
Description: "Request popularity."
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/PopularQ>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 39
CppName: "FI_TR_UNMAPPED"
Name: "TRUnmapped"
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "TR divided by the cube of the number of words in the query and converted by the standard remapTR."
Authors: ["denplusplus", "gulin"]
Responsibles: ["alsafr", "gulin"]
}
Factor {
Index: 40
CppName: "FI_RUS_LANG"
Name: "RusLang"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Document language - Russian."
Authors: ["aalekseev", "denplusplus"]
Responsibles: "alsafr"
}
Factor {
Index: 41
CppName: "FI_ADD_TIME"
Name: "AddTime"
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The time when the page was added, the older the document the higher the number; the root of the time is taken, mapped to the interval [0,1] so that 3+ years results in 1."
Authors: ["aalekseev", "denplusplus"]
Responsibles: "alsafr"
}
Factor {
Index: 42
CppName: "FI_IS_MAIN_PAGE"
Name: "IsMainPage"
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "If it's the homepage of the owner (most often a second-level domain, for example xxxx.ru), then the factor is 1. For free platforms, hostings, personal blogs, etc. (for example, livejournal, narod.ru, etc.) - third-level domains (such as xxxxx.narod.ru) will also have a factor equal to 1."
Authors: ["aalekseev", "denplusplus"]
Responsibles: "alsafr"
}
Factor {
Index: 43
CppName: "FI_ADD_TIME_MP"
Name: "AddTimeMP"
AntiSeoUpperBound: 1.0
Tags: [TG_DATE, TG_HOST, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The time when the homepage of the owner (host?) was added. It is remapped in the same way as AddTime."
Authors: ["aalekseev", "denplusplus"]
Responsibles: "alsafr"
}
Factor {
Index: 44
CppName: "FI_ALICE_MUSIC_TRACK_TITLE_ANNOTATION_MAX_VALUE_WEIGHTED"
Name: "AliceMusicTrackTitleAnnotationMaxValueWeighted"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "AnnotationMaxValueWeighted factor value for AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 45
CppName: "FI_URL_CLICKS_PCTR"
Name: "QueryURLClicksPCTR"
AntiSeoUpperBound: 0.6
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "How often a given URL is clicked for a given query - CTR multiplied by a correction coefficient"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: ["akhropov", "solar"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 46
CppName: "FI_TEXT_BM25"
Name: "TextBM25"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Simple BM25 according to the text."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 47
CppName: "FI_LINK_BM25"
Name: "LinkBM25"
Group: ["LinkBM25", "Dynamic"]
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "A simple BM25 of links; link weights are not taken into account."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 48
CppName: "FI_TLBM25"
Name: "TLBM25"
Group: "TextAndLinkBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "A simple BM25 of text and links together."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 49
CppName: "FI_TLP1"
Name: "TLp1"
Group: "TextAndLinkBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "All query words are mentioned in the text + links."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 50
CppName: "FI_ADV"
Name: "Adv"
Tags: [TG_OWNER, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "The website contains ads."
Authors: ["aalekseev", "denplusplus"]
Responsibles: ["sisoid", "alsafr"]
}
Factor {
Index: 51
CppName: "FI_YANDEX_ADV"
Name: "YandexAdv"
AntiSeoUpperBound: 1.0
Tags: [TG_OWNER, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "The website contains Yandex ads."
Authors: ["aalekseev", "denplusplus"]
Responsibles: ["sisoid", "alsafr"]
}
Factor {
Index: 52
CppName: "FI_NO_SPAM"
Name: "NoSpam"
AntiSeoUpperBound: 1.0
Tags: [TG_OWNER, TG_STATIC, TG_THEME_CLASSIF, TG_REARR_USE, TG_DEPRECATED]
Description: "The spam classifier by antispam features recognized the site as NOT(!) spam. I.e. 0=spam, 1=good."
Authors: ["aalekseev", "denplusplus"]
Responsibles: "alsafr"
}
Factor {
Index: 53
CppName: "FI_TEXT_PAIR"
Name: "TxtPair"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "A simple BM25 of word pairs - we take all pairs of query words and count the number of their usage in the document text. As the weight of the pair, we use the sum of the weights of the words. Note: this doesn't work if there is a stop word in the request."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 54
CppName: "FI_LINK_PAIR"
Name: "LnkPair"
Group: "LinkBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "It's the same as TxtPair but for links; link weights are not taken into account."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 55
CppName: "FI_TEXT_BREAK"
Name: "TxtBreak"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The BM25 of the number of sentences in the document in which it occurs."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 56
CppName: "FI_TEXT_HEAD"
Name: "TxtHead"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The BM25 of words that are used in the heading only."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 57
CppName: "FI_TEXT_HI_RELEV"
Name: "TxtHiRel"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The BM25 of words with only high rel-beats ('significant', with emphasis (<b> etc))."
Authors: "gulin"
Responsibles: "gulin"
}
# TODO(FACTORDEL-97): replace with TG_REMOVED, TG_REUSABLE and remove old formulas
Factor {
Index: 58
CppName: "FI_REMOVED_58"
Name: "Removed_58"
Tags: [TG_UNUSED]
}
Factor {
Index: 59
CppName: "FI_WORD_COUNT"
Name: "WordCount"
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Min(number of query words/10, 1.f)"
Authors: ["denplusplus", "gulin"]
Responsibles: ["alsafr", "gulin"]
}
Factor {
Index: 60
CppName: "FI_INV_WORD_COUNT"
Name: "InvWordCount"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "1 / number_of_words_in_the_query."
Authors: ["denplusplus", "gulin"]
Responsibles: ["alsafr", "gulin"]
}
Factor {
Index: 61
CppName: "FI_HAS_NO_TR"
Name: "HasNoTR"
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: "The document doesn't have TR."
Authors: ["denplusplus", "gulin"]
Responsibles: ["alsafr", "gulin"]
CanonicalValue: 1.0
}
Factor {
Index: 62
CppName: "FI_HAS_NO_LR"
Name: "HasNoLR"
Group: "LegacyLR"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "The document doesn't have LR."
Authors: ["denplusplus", "gulin"]
Responsibles: ["gulin", "alsafr"]
CanonicalValue: 1.0
}
Factor {
Index: 63
CppName: "FI_HAS_NO_QUERY_URL_SHOWS"
Name: "HasNoQueryURLShows"
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "There is no clickability information of a given request's url; 1 - the request or request url are not in the click database, 0 - the request url is in the click database"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#hasnoqueryurldownershows>"
Authors: ["denplusplus", "kostyagin"]
Responsibles: ["tarum", "niknik"]
CanonicalValue: 1.0
}
Factor {
Index: 64
CppName: "FI_HAS_NO_QUERY_SHOWS"
Name: "HasNoQueryShows"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "There is no information about clickability of this request; 1 - the request is not in the click database, 0 - the request is in the click database."
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#hasnoqueryshows>"
Authors: ["denplusplus", "kostyagin", "akhropov"]
Responsibles: ["tarum", "niknik"]
CanonicalValue: 1.0
}
Factor {
Index: 65
CppName: "FI_HOPS"
Name: "Hops"
Tags: [TG_DOC, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of url hops in the bypass (such as - the closer to the homepage (slang), the lower the value (0 - homepage, 1- it's impossible to get here from the homepage (slang), 0 < it's possible to get here from homepage (slang) < 1). The normal value for root node is 0.0039)."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 66
CppName: "FI_LOG_LR"
Name: "LogLR"
AntiSeoUpperBound: 0.85
Group: "Dynamic"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "The logarithm of LR mapped linearly to [0,1]."
Authors: ["denplusplus", "karpik"]
Responsibles: "alsafr"
}
Factor {
Index: 67
CppName: "FI_TEXT_PAIR_EX"
Name: "TxtPairEx"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "the presence of pairs of words in the exact form"
Responsibles: "alsafr"
}
Factor {
Index: 68
CppName: "FI_TEXT_BREAK_EX"
Name: "TxtBreakEx"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "the number of sentences that contain many words in the exact form"
Responsibles: "alsafr"
}
Factor {
Index: 69
CppName: "FI_TEXT_HEAD_EX"
Name: "TxtHeadEx"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "the presence of words in the title in the exact form"
Responsibles: "alsafr"
}
Factor {
Index: 70
CppName: "FI_TEXT_HI_RELEV_EX"
Name: "TxtHiRelEx"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "BM25 as the exact number"
Responsibles: "alsafr"
}
Factor {
Index: 71
CppName: "FI_TEXT_BM25_EX"
Name: "TxtBm25Ex"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "A simple BM25 as the exact number."
Responsibles: "alsafr"
}
Factor {
Index: 72
CppName: "FI_TEXT_PAIR_SYN"
Name: "TxtPairSy"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "the presence of pairs of words while taking synonyms into account (>=TxtPair)"
Responsibles: "alsafr"
}
Factor {
Index: 73
CppName: "FI_TEXT_BRAEK_SYN"
Name: "TxtBreakSy"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "the number of sentences in which many words occur including synonyms"
Responsibles: "alsafr"
}
Factor {
Index: 74
CppName: "FI_TEXT_HEAD_SYN"
Name: "TxtHeadSy"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: "the presence of words in the title, including synonyms"
Responsibles: "alsafr"
}
Factor {
Index: 75
CppName: "FI_TEXT_HI_RELEV_SYN"
Name: "TxtHiRelSy"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "BM25 including synonyms"
Responsibles: "alsafr"
}
Factor {
Index: 76
CppName: "FI_TEXT_BM25_SYN"
Name: "TxtBm25Sy"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "A simple BM25 including synonyms."
Responsibles: "alsafr"
}
Factor {
Index: 77
CppName: "FI_QUERY_DOWNER_CLICKS_PCTR"
Name: "QueryDOwnerClicksPCTR"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "How often people click on the URLs of a given domainId for a given query - CTR domainId multiplied by a correction coefficient"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: ["akhropov", "solar", "denplusplus"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 78
CppName: "FI_HAS_NO_QUERY_DOWNER_SHOWS"
Name: "HasNoQueryDOwnerShows"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "There is no clickability information for the given domainId for this query; 1 - the query or query-owner is not in the click database, 0 - the query-owner is in the click database"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#hasnoqueryurldownershows>"
Authors: ["denplusplus", "kostyagin"]
Responsibles: ["tarum", "niknik"]
CanonicalValue: 1.0
}
Factor {
Index: 79
CppName: "FI_OWNER_CLICKS_PCTR"
Name: "OwnerClicksPCTR"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The clickability of the owner regardless of the query"
Wiki: "<http://wiki.yandex-team.ru/ЯндексПоиск/КачествоПоиска/Клики#ownerclickspctrreg>"
Authors: ["akhropov", "maslov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 80
CppName: "FI_MEGAFON"
Name: "Megafon"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_UNUSED]
Description: "The relative frequency of query words in links (1 - the query words are often found in links, 0.3 - they are rarely found); to be more precise, the value of this factor is decreased under the condition: TR=0 && LR=0 && (there is no link with all query words) && (it did not pass the quota) && (at least one pair of query words occurs in the text)"
Responsibles: "alsafr"
}
Factor {
Index: 81
CppName: "FI_HAS_ALL_WORDS_MERGED"
Name: "XLRp0"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "The links contain all query words"
Responsibles: "alsafr"
}
Factor {
Index: 82
CppName: "FI_HAS_ALL_WORDS_IN_LINK"
Name: "XLRp1"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "One link has all query words"
Responsibles: "alsafr"
}
Factor {
Index: 83
CppName: "FI_PHRASE"
Name: "XLRp2"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "There is a link that passed the quota"
Responsibles: "alsafr"
}
Factor {
Index: 84
CppName: "FI_GOOD_RATIO"
Name: "XLRgood"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "What percentage of links are “good”?"
Responsibles: "alsafr"
}
Factor {
Index: 85
CppName: "FI_MANY_BAD"
Name: "XLRmanyBad"
AntiSeoUpperBound: 1.0
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "How many 'bad' links are there (bad means dpr = 0)"
Responsibles: "alsafr"
}
Factor {
Index: 86
CppName: "FI_LR_MAX_DPR"
Name: "XLRmaxDpr"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "The maximum dpr of the links"
Responsibles: "alsafr"
}
Factor {
Index: 87
CppName: "FI_LR_TF_IDF"
Name: "XLRtfidf"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The regular TF*IDF of links: the word frequency in links is multiplied by the inverse document frequency and summed over all words, then adapted to the length of the document."
Responsibles: "alsafr"
}
Factor {
Index: 88
CppName: "FI_LR_RELEV"
Name: "XLRrelev"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-2>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance from Gulin"
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 89
CppName: "FI_LR_RELEV_200"
Name: "XLRrelev200"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance from Gulin"
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 90
CppName: "FI_LR_LOG_RELEV"
Name: "XLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance from Gulin"
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 91
CppName: "FI_BF_EXACT"
Name: "BFexact"
Group: "BestForm"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "There is an exact form of all query words in text/links"
Responsibles: "alsafr"
}
Factor {
Index: 92
CppName: "FI_BF_LEMMA"
Name: "BFlemma"
Group: "BestForm"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "There is a lemma of all query words in text/links"
Responsibles: "alsafr"
}
Factor {
Index: 93
CppName: "FI_SOFT_AND_OK"
Name: "SoftAndOk"
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The document passed softand on the constraints of the syntactic Sorcerer (algorithm name). It's only for documents that have textual relevance. For single-word queries, it's always 1."
Responsibles: "alsafr"
}
Factor {
Index: 94
CppName: "FI_NEW_LINK_QUALITY"
Name: "NewLinkQuality"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_DEPRECATED]
Description: "Inbound link quality classifier 2; broken, see [407]"
Responsibles: "alsafr"
}
Factor {
Index: 95
CppName: "FI_UKR"
Name: "Ukrainian"
Tags: [TG_STATIC_REGINFO, TG_HOST, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "It equals 1 if the website has a Ukrainian geo-attribute (i.e. 1 - Ukrainian website)"
Responsibles: "alsafr"
}
Factor {
Index: 96
CppName: "FI_IS_BLOG"
Name: "IsBlog"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-5>"
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "It's a blog hosting page"
Authors: ["burmisha", "zudina"]
Responsibles: ["burmisha", "zudina"]
}
Factor {
Index: 97
CppName: "FI_IS_LJ"
Name: "IsLivejournal"
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "It's a livejournal.com page"
Responsibles: "alsafr"
}
# TODO(FACTORDEL-56): replace with TG_REMOVED
Factor {
Index: 98
CppName: "FI_REMOVED_98"
Name: "Removed_98"
Tags: [TG_UNUSED]
}
Factor {
Index: 99
CppName: "FI_SPAM2"
Name: "Spam2"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-3>"
Tags: [TG_OWNER, TG_STATIC, TG_THEME_CLASSIF, TG_DEPRECATED]
Description: "Alekseev's automatic spam classifier: the probability that this is a spam website (0 is not spam, 1 is spam)"
Authors: "abv"
Responsibles: "abv"
}
Factor {
Index: 100
CppName: "FI_TEXT_FEATURES"
Name: "TextFeatures"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The quality of the text. It is calculated by using a very complex formula"
Responsibles: "alsafr"
}
Factor {
Index: 101
CppName: "FI_TEXT_LIKE"
Name: "TextLike"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The quality of the text (Alekseev classifier)"
Responsibles: "alsafr"
}
# TODO(FACTORDEL-56): replace with TG_REMOVED
Factor {
Index: 102
CppName: "FI_REMOVED_102"
Name: "Removed_102"
Tags: [TG_UNUSED]
}
# TODO(FACTORDEL-56): replace with TG_REMOVED
Factor {
Index: 103
CppName: "FI_REMOVED_103"
Name: "Removed_103"
Tags: [TG_UNUSED]
}
Factor {
Index: 104
CppName: "FI_YABAR_CORE_OWNER"
Name: "YaBarCoreOwner"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The core of the owners' audience according to Yandex.Browsing"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/coreaudience/>"
Authors: "monster"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 105
CppName: "FI_YABAR_CORE_HOST"
Name: "YaBarCoreHost"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The core of the hosts' audience according to Yandex.Browsing"
Authors: "kostyagin"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/coreaudience/>"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 106
CppName: "FI_HAS_YA_BAR_CORE"
Name: "HasYaBarCore"
AntiSeoUpperBound: 1.0
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "Does the host have a core?"
Authors: "kostyagin"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/coreaudience/>"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 107
CppName: "FI_SPAM_KARMA"
Name: "SpamKarma"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-4>"
Tags: [TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "Spam karma from the antispammers: the probability that the host is spam, based on WHOIS information"
Authors: "abv"
Responsibles: "abv"
}
Factor {
Index: 108
CppName: "FI_MUSIC_Q"
Name: "MusicQ"
DependsOn: [{Feature: ["MusicQ"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The query's musicality. The output of Anton Konygin's Sorcerer (algorithm name)."
Responsibles: "alsafr"
UseArtifact: {Name: "MusicWizardClassificator"}
}
Factor {
Index: 109
CppName: "FI_EXACT_MATCHES"
Name: "XLExactMatches"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The number of links that match the query exactly"
Responsibles: "alsafr"
}
Factor {
Index: 110
CppName: "FI_DOC_LEN"
Name: "DocLen"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document length in sentences"
Responsibles: "alsafr"
}
Factor {
Index: 111
CppName: "FI_URL_LEN"
Name: "UrlLen"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The URL length divided by 5"
Responsibles: "alsafr"
}
Factor {
Index: 112
CppName: "FI_QUERY_NON_COMMERCIALITY"
Name: "QueryNonCommerciality"
DependsOn: [{Feature: ["QueryNonCommerciality"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_COMMERCIAL, TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "How commercial the query is, according to a phrase dictionary from Direct: 0 - maximum (commercial query), 1 - minimum (non-commercial query)."
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryNonCommerciality>"
Ticket: "SEARCHSPAM-7504"
Authors: "somov"
Responsibles: ["sisoid", "anelyubin"]
}
Factor {
Index: 113
CppName: "FI_HOST_SIZE"
Name: "HostSize"
AntiSeoUpperBound: 1.0
Tags: [TG_HOST, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The size of the host according to Raskovalov, in documents, without deduplication (each duplicate is accounted for in the factor as an independent document)"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 114
CppName: "FI_IS_HTML"
Name: "IsHTML"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Document type - HTML"
Responsibles: "alsafr"
}
Factor {
Index: 115
CppName: "FI_LINK_SPEED"
Name: "LinkSpeed"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-4>"
Group: "Xref"
Tags: [TG_DATE, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The reciprocal of the variance of the times of appearance of links with query words. In other words, how often links with query words pointing to the website appear (link velocity)"
Responsibles: "alsafr"
}
Factor {
Index: 116
CppName: "FI_TH_LR_RELEV"
Name: "XThLRrelev"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-5>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on theme"
Responsibles: "alsafr"
}
Factor {
Index: 117
CppName: "FI_TH_LR_RELEV_200"
Name: "XThLRrelev200"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on theme"
Responsibles: "alsafr"
}
Factor {
Index: 118
CppName: "FI_TH_LR_LOG_RELEV"
Name: "XThLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on theme"
Responsibles: "alsafr"
}
Factor {
Index: 119
CppName: "FI_LERF_LR_RELEV"
Name: "XLerfLRrelev"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-8>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on the quality of each link"
Responsibles: "alsafr"
}
Factor {
Index: 120
CppName: "FI_LERF_LR_RELEV_200"
Name: "XLerfLRrelev200"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on the quality of each link"
Responsibles: "alsafr"
}
Factor {
Index: 121
CppName: "FI_LERF_LR_LOG_RELEV"
Name: "XLerfLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on the quality of each link"
Responsibles: "alsafr"
}
Factor {
Index: 122
CppName: "FI_LERF_TH_LR_LOG_RELEV"
Name: "XLerfThLRlogRelev"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-11>"
Group: "Xref"
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on the quality and theme of each link"
Responsibles: "alsafr"
}
Factor {
Index: 123
CppName: "FI_NON_COMM_LR_LOG_RELEV"
Name: "XNonCommLRlogRelev"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-12>"
Group: "Xref"
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on the non-commercial nature of each link"
Responsibles: "alsafr"
}
Factor {
Index: 124
CppName: "FI_NON_COMM_TH_LR_LOG_RELEV"
Name: "XNonCommThLRlogRelev"
AntiSeoUpperBound: 1.0
Group: "Xref"
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on the non-commercial nature of each link and theme"
Responsibles: "alsafr"
}
Factor {
Index: 125
CppName: "FI_NON_COMM_LERF_LR_LOG_RELEV"
Name: "XNonCommLerfLRlogRelev"
AntiSeoUpperBound: 1.0
Group: "Xref"
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on the non-commercial nature of each link and its quality"
Responsibles: "alsafr"
}
Factor {
Index: 126
CppName: "FI_NON_COMM_LERF_TH_LR_LOG_RELEV"
Name: "XNonCommLerfThLRlogRelev"
AntiSeoUpperBound: 1.0
Group: "Xref"
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The link relevance based on the non-commercial nature of each link, its quality and theme"
Responsibles: "alsafr"
}
Factor {
Index: 127
CppName: "FI_GEO_CITY_PROXIM"
Name: "GeoCityProxim"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_GEOINQUERY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "There is a match between the region mentioned in the query and the websites found at the region level. A binary factor: 1 - there is a match, 0 - there is no match. Based on the ((<http://wiki.yandex-team.ru/ЯндексПоиск/КлассификацияСайтовИСтраниц/Географическая/ИспользованиеВПоиске> geo-classification of websites))"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 128
CppName: "FI_LINKS_WITH_WORDS_PERCENT"
Name: "LinksWithWordsPercent"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_UNUSED]
Description: "The percentage of incoming links with query words"
Responsibles: "alsafr"
}
Factor {
Index: 129
CppName: "FI_LINKS_WITH_ALL_WORDS_PERCENT"
Name: "LinksWithAllWordsPercent"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_UNUSED]
Description: "The percentage of incoming links with all query words"
Responsibles: "alsafr"
}
Factor {
Index: 130
CppName: "FI_PORNO_QUERY"
Name: "PornoQuery"
DependsOn: [{Feature: ["PornoQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "Does the query contain words from yweb/pornofilter/porno.query?"
Wiki: "<http://wiki.yandex-team.ru//h.yandex.net/?https%3A%2F%2Ftree.yandex.ru%2Fcgi-bin%2Fcvsweb.cgi%2Farcadia%2Fyweb%2Fpornofilter%2Fporno.query>"
Responsibles: "alsafr"
UseArtifact: {Name: "PornoQueryList"}
}
Factor {
Index: 131
CppName: "FI_IS_PORNO"
Name: "IsPorno"
AntiSeoUpperBound: 1.0
Ticket: "BETATEST-151"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document is from the porn industry"
Responsibles: "abv"
}
Factor {
Index: 132
CppName: "FI_IS_COMM"
Name: "IsComm"
AntiSeoUpperBound: 1.0
Ticket: "BETATEST-151"
Tags: [TG_COMMERCIAL, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: "It's a commercial document. It is not being used (deprecated)"
Comment: "Still used in formula and polinom :("
Responsibles: "sisoid"
}
Factor {
Index: 133
CppName: "FI_IS_FAKE"
Name: "IsFake"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "A fake document"
Responsibles: "alsafr"
}
Factor {
Index: 134
CppName: "FI_IS_SEO"
Name: "IsSEO"
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: "The page heading contains commercial vocabulary. It is not being used (deprecated)"
Responsibles: "alsafr"
}
Factor {
Index: 135
CppName: "FI_IS_WIKI"
Name: "IsWiki"
AntiSeoUpperBound: 1.0
Tags: [TG_HOST, TG_STATIC, TG_WIKIPEDIA, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "A page from ru.wikipedia.org"
Responsibles: "alsafr"
}
Factor {
Index: 136
CppName: "FI_IS_ESHOP"
Name: "IsEShop"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "A commercial page (Savin's classifier)"
Authors: "asavin"
Responsibles: "asavin"
}
Factor {
Index: 137
CppName: "FI_GEO_REGION_PROXIM"
Name: "GeoRegionProxim"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_GEOINQUERY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 138
CppName: "FI_HAS_NO_ALL_WORDS_TR_SYN"
Name: "HasNoAllWordsTRSy"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document does not contain all the query words (synonyms are counted as matches)"
Responsibles: "alsafr"
CanonicalValue: 1.0
}
Factor {
Index: 139
CppName: "FI_NUM_WORDS_TR_SYN"
Name: "NumWordsTRSy"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of query words in a document (synonyms are counted as matches)"
Responsibles: "alsafr"
}
Factor {
Index: 140
CppName: "FI_HAS_ALL_WORDS_TR_SYN"
Name: "HasAllWordsTRSy"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document contains all query words (synonyms are counted as matches)"
Responsibles: "alsafr"
}
Factor {
Index: 141
CppName: "FI_NUM_WORDS_LR"
Name: "NumWordsLR"
Group: "LinkBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The percentage of query words in links (synonyms are counted as matches)"
Responsibles: "alsafr"
}
Factor {
Index: 142
CppName: "FI_HAS_ALL_WORDS_LR"
Name: "HasAllWordsLR"
Group: "LinkBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The links contain all query words (synonyms are counted as matches)"
Responsibles: "alsafr"
}
Factor {
Index: 143
CppName: "FI_PAY_DETECTOR_PREDICT"
Name: "PayDetectorPredict"
Ticket: "COMMERCIAL-4"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: "The value of the commerce detector calculated in Begemot (the component's name; literally 'Hippopotamus')."
MinValue: -10
MaxValue: 10
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
ImplementationTime: "2020-08-01"
}
Factor {
Index: 144
CppName: "FI_TEXT_INV_PAIR"
Name: "TxtInvPair"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "TR on pairs of query words in reverse order"
Responsibles: "alsafr"
}
Factor {
Index: 145
CppName: "FI_LINK_INV_PAIR"
Name: "LnkInvPair"
Group: "LinkBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "LR on pairs of query words in reverse order"
Responsibles: "alsafr"
}
Factor {
Index: 146
CppName: "FI_TEXT_SKIP_PAIR"
Name: "TxtSkipPair"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "TR on pairs of query words that are one word apart in the query (skip pairs), in texts"
Responsibles: "alsafr"
}
Factor {
Index: 147
CppName: "FI_LINK_SKIP_PAIR"
Name: "LnkSkipPair"
Group: "LinkBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "LR on pairs of query words that are one word apart in the query (skip pairs), in texts"
Responsibles: "alsafr"
}
Factor {
Index: 148
CppName: "FI_NUM_WORDS_TRFM"
Name: "NumWordsTRFm"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of all query words in the text (with an accuracy of a form)"
Responsibles: "alsafr"
}
Factor {
Index: 149
CppName: "FI_HAS_ALL_WORDS_TRFM"
Name: "HasAllWordsTRFm"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document contains all query words (with an accuracy of a form)"
Responsibles: "alsafr"
}
Factor {
Index: 150
CppName: "FI_Q_DIVERSITY"
Name: "QDiversity"
DependsOn: [{Feature: ["QDiversity"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The level of point centralization from which the request is made"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QDiversity>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 151
CppName: "FI_Q_BLOG"
Name: "QBlog"
DependsOn: [{Feature: ["QBlog"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "Does the query contain blogging vocabulary?"
Responsibles: "alsafr"
}
Factor {
Index: 152
CppName: "FI_GEO_LR_LOG_RELEV"
Name: "XGeoLRlogRelev"
AntiSeoUpperBound: 0.9
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "log(LR, narrowed down to the user's country)"
Responsibles: "alsafr"
}
Factor {
Index: 153
CppName: "FI_LERF_GEO_LR_LOG_RELEV"
Name: "XLerfGeoLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "log(LerfLR, narrowed down to the user's country)"
Responsibles: "alsafr"
}
Factor {
Index: 154
CppName: "FI_NON_COMMERCIAL_QUERY"
Name: "NonCommercialQuery"
DependsOn: [{Feature: ["NonCommercialQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_COMMERCIAL, TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "Binary flag for a non-commercial query: QueryNonCommerciality > 0.965."
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryNonCommerciality>"
Ticket: "SEARCHSPAM-7504"
Responsibles: ["sisoid", "anelyubin"]
}
Factor {
Index: 155
CppName: "FI_EXACT_MATCHES_MAP"
Name: "XLExactMatchesMap"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "The number of links that match the query text (another remap)"
Responsibles: "alsafr"
}
Factor {
Index: 156
CppName: "FI_LERF_NORM_LR_LOG_RELEV"
Name: "XLerfNormLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "XLerfLRlogRelev (normalized to the sum of all links' Lerf-weights, not to the sum of their original weights)"
Responsibles: "alsafr"
}
Factor {
Index: 157
CppName: "FI_NON_COMM_NORM_LR_LOG_RELEV"
Name: "XNonCommNormLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "XNonCommLRlogRelev (normalized to the sum of all links' NonComm-weights, not to the sum of their original weights)"
Responsibles: "alsafr"
}
Factor {
Index: 158
CppName: "FI_NON_COMM_TH_NORM_LR_LOG_RELEV"
Name: "XNonCommThNormLRlogRelev"
Group: "Xref"
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Link relevance taking into account the non-commercial nature of each link and theme"
Responsibles: "alsafr"
}
Factor {
Index: 159
CppName: "FI_NON_COMM_LERF_NORM_LR_LOG_RELEV"
Name: "XNonCommLerfNormLRlogRelev"
Group: "Xref"
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "XNonCommLerfLRlogRelev (normalized to the sum of all links' NonCommLerf-weights, not to the sum of their original weights)"
Responsibles: "alsafr"
}
Factor {
Index: 160
CppName: "FI_NON_COMM_LERF_TH_NORM_LR_LOG_RELEV"
Name: "XNonCommLerfThNormLRlogRelev"
Group: "Xref"
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Link relevance taking into account the non-commercial nature, the quality, and the theme of each link"
Responsibles: "alsafr"
}
Factor {
Index: 161
CppName: "FI_NEVASCA1"
Name: "Nevasca1"
Tags: [TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "Content duplication is not found. The 'goodness' of a host (from 0 to 1) is calculated based on how many and which hosts borrow content from the given host."
Authors: "antonovvk"
Responsibles: "antonovvk"
}
Factor {
Index: 162
CppName: "FI_NEVASCA2"
Name: "Nevasca2"
Tags: [TG_OWNER, TG_STATIC, TG_DEPRECATED]
Description: "Content duplication is not found. The 'badness' of a host (from 0 to 1) is proportional to the amount of secondary content on the host."
Authors: "antonovvk"
Responsibles: "antonovvk"
}
Factor {
Index: 163
CppName: "FI_LINK_AGE"
Name: "LinkAge"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The average age of links that contributed something to LR. LinkAge = Min(log(average age of the link)/7, 1), where 1 corresponds to 3 years"
Responsibles: "alsafr"
}
Factor {
Index: 164
CppName: "FI_TLEN"
Name: "TLen"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The length of the page text in words. TLen = Map(the number of words, 1/400), where Map(x, y) = x*y / (1 + x*y)"
Responsibles: "alsafr"
}
Factor {
Index: 165
CppName: "FI_IS_UNREACHABLE"
Name: "IsUnreachable"
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The page is unreachable via links from the homepage."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 166
CppName: "FI_LANG_LR_LOG_RELEV"
Name: "XLangLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "LR taking into account the match between the link language and the query"
Responsibles: "alsafr"
}
Factor {
Index: 167
CppName: "FI_LERF_LANG_LR_LOG_RELEV"
Name: "XLerfLangLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "LR taking into account the match of the link language, the query, and the boost"
Responsibles: "alsafr"
}
Factor {
Index: 168
CppName: "FI_QUERY_URL_CLICKS_FRC"
Name: "QueryURLClicksFRC"
AntiSeoUpperBound: 0.3
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The ratio of the number of clicks on a given URL to all clicks of the query"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: ["lidia", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 169
CppName: "FI_QUERY_DOWNER_CLICKS_FRC"
Name: "QueryDOwnerClicksFRC"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The ratio of the number of clicks on a given domainId to all clicks of a query"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: ["lidia", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 170
CppName: "FI_QUERY_URL_CLICKS_PCTR_COPY"
Name: "QueryURLClicksPCTR_copy"
AntiSeoUpperBound: 0.42
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_DEPRECATED, TG_L2]
Countries: CNT_RELEV
Description: "[Bug: Factor 45 copy] How often a given URL is clicked for a given query - CTR multiplied by a correction coefficient"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: ["akhropov", "solar"]
Responsibles: ["akhropov", "diver"]
}
Factor {
Index: 171
CppName: "FI_DOPP_URL_SESSION_CLICKS_FRC_CITY"
Name: "DoppQueryUrlSessionClicksFRCCity"
Ticket: "FACTOR-311"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DoppQueryUrlSessionClicksFRC>"
Tags: [TG_USER, TG_USER_SEARCH, TG_DYNAMIC, TG_DOC, TG_LOCALIZED_CITY, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_L2, TG_REARR_USE, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "What part (on average for the session) does the given URL make up of the URLs clicked on this query with the user's city added? It's calculated based on user sessions."
Authors: "esoloviev"
Responsibles: ["esoloviev", "kolesov93", "tarum", "niknik"]
}
Factor {
Index: 172
CppName: "FI_QUERY_URL_CLICKS_PCTR_REG"
Name: "QueryURLClicksPCTR_Reg"
AntiSeoUpperBound: 0.4
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "How often is a given URL clicked on for a given query - CTR multiplied by the correction factor, on small regions from relev_regions.web.txt"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 173
CppName: "FI_QUERY_DOWNER_CLICKS_PCTR_REG"
Name: "QueryDOwnerClicksPCTR_Reg"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "How often are given domainId URLs clicked on for a given query - CTR domainId multiplied by the correction factor, on small regions from relev_regions.web.txt"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 174
CppName: "FI_QUERY_URL_CLICKS_FRC_REG"
Name: "QueryURLClicksFRC_Reg"
AntiSeoUpperBound: 0.25
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The ratio of the number of clicks on a given URL to all clicks of the query, on small regions from relev_regions.web.txt"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 175
CppName: "FI_QUERY_DOWNER_CLICKS_FRC_REG"
Name: "QueryDOwnerClicksFRC_Reg"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The ratio of the number of clicks on a given domainId to all clicks of the query, on small regions from relev_regions.web.txt"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 176
CppName: "FI_QUERY_URL_CLICKS_COMBO_REG"
Name: "QueryURLClicksCombo_Reg"
AntiSeoUpperBound: 0.5
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "Query URL Clicks Combo, for small regions from relev_regions.web.txt"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 177
CppName: "FI_QUERY_DOWNER_CLICKS_COMBO_REG"
Name: "QueryDOwnerClicksCombo_Reg"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "Query DOwner Clicks Combo, for small regions from relev_regions.web.txt"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 178
CppName: "FI_CATALOG_RELEV"
Name: "XLRCatalogRelev"
AntiSeoUpperBound: 1.0
Group: "Xref"
Tags: [TG_CATALOG, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "LR based on catalog descriptions"
Responsibles: "alsafr"
}
Factor {
Index: 179
CppName: "FI_YA_CATALOG_RELEV"
Name: "XLRYaCatalogRelev"
Group: "Xref"
Tags: [TG_CATALOG, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "LR based on Yandex.Catalog description"
Responsibles: "alsafr"
}
Factor {
Index: 180
CppName: "FI_EXACT_WORD_ORDER_LEN"
Name: "ExactWordOrderLen"
Group: "CombinedSequences"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The length of the maximum match of forms in the text and the query"
Authors: "pzuev"
Responsibles: "pzuev"
}
Factor {
Index: 181
CppName: "FI_EXACT_WORD_ORDER_WEIGHT"
Name: "ExactWordOrderWeight"
Group: "CombinedSequences"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The weight of the maximum match of forms in the text and the query"
Authors: "pzuev"
Responsibles: "pzuev"
}
Factor {
Index: 182
CppName: "FI_WORD_ORDER_LEN"
Name: "WordOrderLen"
Group: "CombinedSequences"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The length of the maximum match by lemma in the text and the query"
Authors: "pzuev"
Responsibles: "pzuev"
}
Factor {
Index: 183
CppName: "FI_WORD_ORDER_WEIGHT"
Name: "WordOrderWeight"
Group: "CombinedSequences"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The weight of the maximum match by lemma in the text and query"
Authors: "pzuev"
Responsibles: "pzuev"
}
Factor {
Index: 184
CppName: "FI_LINK_MAX_AGE"
Name: "LinkMaxAge"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "The maximum age of a significant amount of links that contributed something to LR"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 185
CppName: "FI_TEXT_RELEV_ALL_WORDS_WITH_STOPS"
Name: "TRp1All"
AntiSeoUpperBound: 1.0
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: "The variations of corresponding factors considering stop words"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 186
CppName: "FI_LINK_RELEV_ALL_WORDS_WITH_STOPS"
Name: "LRp1All"
AntiSeoUpperBound: 1.0
Group: "LegacyLR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The variations of corresponding factors considering stop words"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 187
CppName: "FI_TLP1_ALL"
Name: "TLp1All"
Group: "TextAndLinkBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: "The variations of corresponding factors considering stop words"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 188
CppName: "FI_BF_EXACT_ALL"
Name: "BFexactAll"
Group: "BestForm"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Description: "The variations of corresponding factors considering stop words"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 189
CppName: "FI_BF_LEMMA_ALL"
Name: "BFlemmaAll"
Group: "BestForm"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Description: "The variations of corresponding factors considering stop words"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 190
CppName: "FI_PASSAGE_LEGACY_TR"
Name: "PassageLegacyTR"
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "TR of the best passage - how high the quality of the snippet can be"
Responsibles: "alsafr"
}
Factor {
Index: 191
CppName: "FI_TEXT_BM25_ATTEN_SYN"
Name: "TxtBM25AttenSyn"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "TR with a discount for the sentence number"
Authors: "pzuev"
Responsibles: "pzuev"
}
Factor {
Index: 192
CppName: "FI_MAX_WORD_HOST_RANK"
Name: "MaxWordHostRank"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LINK_TEXT, TG_LINK_GRAPH, TG_DEPRECATED]
Description: "The host rank for the most expressed query word (usually it's the name of the website)"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/PWR>"
Authors: "finder"
Responsibles: "akhropov"
}
Factor {
Index: 193
CppName: "FI_MAX_WORD_HOST_CLICKS"
Name: "MaxWordHostClicks"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED]
Description: "The clickability of domAttr based on the most expressed word. For example, for all queries that contain the word Wikipedia, the Wikipedia pages are clicked on."
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC>"
Authors: "finder"
Responsibles: "akhropov"
}
Factor {
Index: 194
CppName: "FI_DOM_PHRASE_RANK"
Name: "DomPhraseRank"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LINK_TEXT, TG_LINK_GRAPH, TG_DEPRECATED]
Description: "HostRank based on individual words"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/PWR>"
Authors: "finder"
Responsibles: "akhropov"
}
Factor {
Index: 195
CppName: "FI_DOM_PHRASE_CLICK_RANK"
Name: "DomPhraseClickRank"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED]
Description: "The clickability of the domain based on words"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC>"
Authors: "finder"
Responsibles: "akhropov"
}
Factor {
Index: 196
CppName: "FI_IS_FORUM"
Name: "IsForum"
Ticket: ["BUKI-1543", "SEARCHSPAM-3650"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsForum>"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The URL matches the FORUM_DETECTOR regular expression"
Authors: "zudina"
Responsibles: "zudina"
}
Factor {
Index: 197
CppName: "FI_ALICE_MUSIC_TRACK_TITLE_ANNOTATION_MATCH_WEIGHTED_VALUE"
Name: "AliceMusicTrackTitleAnnotationMatchWeightedValue"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "AnnotationMatchWeightedValue factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 198
CppName: "FI_IS_OBSOLETE"
Name: "IsObsolete"
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The URL contains an old date, which lets us recognize old news. The factor is 1 if the URL contains a year <= 2007."
Authors: "finder"
Responsibles: "finder"
}
Factor {
Index: 199
CppName: "FI_TR_WITH_STOPS"
Name: "TRWithStops"
AntiSeoUpperBound: 1.0
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The weight of the maximum form match in the text and the query"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 200
CppName: "FI_LR_WITH_STOPS"
Name: "LRWithStops"
AntiSeoUpperBound: 1.0
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_UNUSED]
Description: "The weight of the maximum form match in the text and the query"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 201
CppName: "FI_HAS_PAYMENTS"
Name: "HasPayments"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The page contains information about 'SMS payment'."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 202
CppName: "FI_IS_LINK_PESSIMISED"
Name: "IsLinkPessimised"
Tags: [TG_OWNER, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "The anti-spammers have pessimized the site - all dynamic linking factors are reset to 0. zerolnk.flt"
Authors: "zudina"
Responsibles: "zudina"
}
Factor {
Index: 203
CppName: "FI_ESHOP_VALUE"
Name: "EshopValue"
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Can people buy anything on the page?"
Authors: "asavin"
Responsibles: "asavin"
}
Factor {
Index: 204
CppName: "FI_PORNO_VALUE"
Name: "PornoValue"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Is this a page with pornographic content?"
Authors: "asavin"
Responsibles: "asavin"
}
Factor {
Index: 205
CppName: "FI_TRAFGRAPH_OUT_ALL_SHARE_M"
Name: "TrafgraphOutAll_share_m"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: "Remapped mascot feature TrafgraphOutAll_share_m"
Ticket: "SEARCHSPAM-15531"
Authors: ["bikulov"]
Responsibles: ["bikulov", "sdormidontov"]
ImplementationTime: "2020-09-30"
}
Factor {
Index: 206
CppName: "FI_TRAFGRAPH_OUT_ALL_SE_SHARE_D"
Name: "TrafgraphOutAllSE_share_d"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: "Remapped mascot feature TrafgraphOutAllSE_share_d"
Ticket: "SEARCHSPAM-15531"
Authors: ["bikulov"]
Responsibles: ["bikulov", "sdormidontov"]
ImplementationTime: "2020-09-30"
}
Factor {
Index: 207
CppName: "FI_TRAFGRAPH_OUT_ALL_SE_SHARE_M"
Name: "TrafgraphOutAllSE_share_m"
Ticket: "SEARCHSPAM-15531"
Authors: ["bikulov"]
Responsibles: ["bikulov", "sdormidontov"]
Description: "Remapped mascot feature TrafgraphOutAllSE_share_m"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED],
}
Factor {
Index: 208
CppName: "FI_NO_EXT_CLICKS_SHARE"
Name: "NoExtClicksShare"
Ticket: "SEARCHSPAM-15531"
Authors: ["bikulov"]
Responsibles: ["bikulov", "sdormidontov"]
Description: "Remapped mascot feature NoExtClicksShare"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED],
}
Factor {
Index: 209
CppName: "FI_COUNTERS_SEARCH_TRAFFIC1"
Name: "CountersSearchTraffic1"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/usercounteractions/Simple>"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_COUNTER, TG_UNUSED, TG_L2]
Description: "The search traffic - clicks from search engines on the website (the 2nd formula)"
Authors: ["amotuzov", "denplusplus"]
Responsibles: "smikler"
}
Factor {
Index: 210
CppName: "FI_COUNTERS_SEARCH_TRAFFIC2"
Name: "CountersSearchTraffic2"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/usercounteractions/Simple>"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_COUNTER, TG_UNUSED, TG_L2]
Description: "The search traffic - clicks from search engines on the website (the 2nd formula)"
Authors: ["amotuzov", "denplusplus"]
Responsibles: "smikler"
}
Factor {
Index: 211
CppName: "FI_DOM_PHRASE_YABAR"
Name: "DomPhraseYabar"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED]
Description: "Traffic to the website from search engines via individual words, according to Yandex.Bar data"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC>"
Authors: "finder"
Responsibles: "akhropov"
}
Factor {
Index: 212
CppName: "FI_ALICE_MUSIC_ARTIST_NAME_BCLM_MIX_PLAIN_KE5"
Name: "AliceMusicArtistNameBclmMixPlainK000001"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALICE_MUSIC, TG_ALLOW_USE_FOR_ALICE]
Description: "The BclmMixPlainK000001 factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 213
CppName: "FI_QUERY_URL_LCS"
Name: "QueryUrlLCS"
Tags: [TG_DYNAMIC, TG_DOC, TG_URL_TEXT, TG_L2, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlLCS>"
Ticket: "FACTOR-417"
Description: "The largest common substring of URL and query, normalized by the URL's length"
Authors: ["mbusel", "tsimkha", "alsafr"]
Responsibles: ["mbusel", "tsimkha"]
}
Factor {
Index: 214
CppName: "FI_ONLY_URL"
Name: "OnlyUrl"
Group: "UrlBM25"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/OnlyUrl>"
Tags: [TG_DOC, TG_DYNAMIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "All matches are found only in the URL, there are no matches in the page text"
Authors: "denplusplus"
Responsibles: ["alsafr", "stash93"]
}
Factor {
Index: 215
CppName: "FI_GEO_RELEV_REGION_CITY"
Name: "GeoRelevRegionCity"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 216
CppName: "FI_GEO_RELEV_REGION_REGION"
Name: "GeoRelevRegionRegion"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 217
CppName: "FI_GEO_RELEV_REGION_COUNTRY"
Name: "GeoRelevRegionCountry"
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L3_OVERWRITE, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Three levels of the match between the geography of the user and the page"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 218
CppName: "FI_LR_GEO_RELEV_REGION_CITY"
Name: "XLRGeoRelevRegionCity"
AntiSeoUpperBound: 1.0
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 219
CppName: "FI_LR_GEO_RELEV_REGION_REGION"
Name: "XLRGeoRelevRegionRegion"
AntiSeoUpperBound: 1.0
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 220
CppName: "FI_LR_GEO_RELEV_REGION_COUNTRY"
Name: "XLRGeoRelevRegionCountry"
AntiSeoUpperBound: 1.0
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_UNUSED]
Description: "Three levels of the match between the link region and query"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 221
CppName: "FI_GEO_COUNTRY_PROXIM"
Name: "GeoCountryProxim"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Geographic proximity"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 222
CppName: "FI_IS_NAV_QUERY"
Name: "IsNavQuery"
DependsOn: [{Feature: ["IsNavQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_NAV, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Description: "Is the query navigational, based on the clickability of the answers"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsNav>"
Authors: ["akhropov", "denplusplus", "prs"]
Responsibles: ["tarum", "niknik"]
UseArtifact: {Name: "IsNavTrie"}
}
Factor {
Index: 223
CppName: "FI_MAX_WORD_HOST_YABAR"
Name: "MaxWordHostYaBar"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "The most suitable query word describing the website, based on the Yandex Bar data"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC>"
Authors: "finder"
Responsibles: "akhropov"
}
Factor {
Index: 224
CppName: "FI_FIRST_WORD_HOST_CLICKS"
Name: "FirstWordHostClicks"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "Clickability of the host for the first word of the query. Quite often, the first (last) query word is an explicit indication of the website where we should look for information."
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC>"
Authors: "finder"
Responsibles: "akhropov"
}
Factor {
Index: 225
CppName: "FI_ALICE_MUSIC_ARTIST_NAME_CMMATCH_TOP5_AVG_MATCH"
Name: "AliceMusicArtistNameCMMatchTop5AvgMatch"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The CMMatchTop5AvgMatch factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 226
CppName: "FI_QUERY_DOWNER_YABAR_VISITS"
Name: "QueryDOwnerYabarVisits"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 227
CppName: "FI_QUERY_DOWNER_YABAR_VISITORS"
Name: "QueryDOwnerYabarVisitors"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 228
CppName: "FI_QUERY_DOWNER_YABAR_AVG_TIME"
Name: "QueryDOwnerYabarAvgTime"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_REARR_USE, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Description: "Average (among users) active continuous time spent by a user (in seconds) on the host's pages after clicking on a query in SERP (the factor depends on the pair (query,domAttr))."
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 229
CppName: "FI_QUERY_DOWNER_YABAR_AVG_TIME2"
Name: "QueryDOwnerYabarAvgTime2"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Description: "Average (among users) active continuous time spent by a user (in seconds) on the host's pages after clicking on a query in SERP (the factor depends on the pair (query,domAttr)). Based on the internal counter of Yandex.Bar/Elements/Browser"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 230
CppName: "FI_QUERY_DOWNER_YABAR_AVG_ACTIONS"
Name: "QueryDOwnerYabarAvgActions"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_REARR_USE, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Description: "The average number (among users) of active actions (clicks, keystrokes) on the host pages after clicking on the website in SERP (the factor depends on the pair (query, domAttr)). Based on the internal counter of Yandex.Bar/Elements/Browser"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 231
CppName: "FI_QUERY_URL_YABAR_VISITS"
Name: "QueryUrlYabarVisits"
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_L2]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["akhropov", "diver"]
}
Factor {
Index: 232
CppName: "FI_QUERY_URL_YABAR_VISITORS"
Name: "QueryUrlYabarVisitors"
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_REARR_USE, TG_DEPRECATED, TG_L2]
Description: "The number of unique visitors from search engines for a specific query"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["akhropov", "diver"]
}
Factor {
Index: 233
CppName: "FI_QUERY_URL_YABAR_AVG_TIME"
Name: "QueryUrlYabarAvgTime"
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_L2]
Description: "Average (among users) active continuous time spent by a user (in seconds) on the page after clicking on it in SERP (the factor depends on the pair (query,URL))."
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["akhropov", "diver"]
}
Factor {
Index: 234
CppName: "FI_QUERY_URL_YABAR_AVG_TIME2"
Name: "QueryUrlYabarAvgTime2"
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_L2]
Description: "Average (among users) active continuous time spent by a user (in seconds) on the page after clicking on it in SERP (the factor depends on the pair (query,URL)). Based on the internal counter of Yandex.Bar/Elements/Browser"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["akhropov", "diver"]
}
Factor {
Index: 235
CppName: "FI_QUERY_URL_YABAR_AVG_ACTIONS"
Name: "QueryUrlYabarAvgActions"
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_L2]
Description: "The average number (among users) of active actions (clicks, keystrokes) on the page after clicking on it in SERP (the factor depends on the pair (query, URL))."
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/>"
Authors: "akhropov"
Responsibles: ["akhropov", "diver"]
}
Factor {
Index: 236
CppName: "FI_DSSM_BERT_DISTILL_SINSIG_MSE_BASE_REG_CHAIN"
Name: "DssmBertDistillSinsigMseBaseRegChain"
Tags: [TG_REMOVED]
Description: "A set of PRS logs is marked up using Bert trained on sinsig. A dssm model is trained on this set using BaseRegionChain"
UseArtifact: {Name: "DssmBertDistillSinsigMseBaseRegChain"}
Ticket: "FACTOR-2287"
Authors: ["ivaninap", "rmplstiltskin"]
Responsibles: ["ivaninap", "rmplstiltskin"]
ImplementationTime: "2020-02-21"
}
Factor {
Index: 237
CppName: "FI_DSSM_BERT_DISTILL_RELEVANCE_MSE_BASE_REG_CHAIN"
Name: "DssmBertDistillRelevanceMseBaseRegChain"
Tags: [TG_REMOVED]
Description: "A set of PRS logs is marked up using Bert trained on relevance. A dssm model is trained on this set using BaseRegionChain"
UseArtifact: {Name: "DssmBertDistillRelevanceMseBaseRegChain"}
Ticket: "FACTOR-2287"
Authors: ["ivaninap", "rmplstiltskin"]
Responsibles: ["ivaninap", "rmplstiltskin"]
ImplementationTime: "2020-02-21"
}
Factor {
Index: 238
CppName: "FI_ALICE_MUSIC_ARTIST_NAME_PER_WORD_CM_MAX_MATCH_MIN"
Name: "AliceMusicArtistNamePerWordCMMaxMatchMin"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The PerWordCMMaxMatchMin factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 239
CppName: "FI_ALICE_MUSIC_ARTIST_NAME_ATTENV1_BM15_K05"
Name: "AliceMusicArtistNameAttenV1_Bm15_K05"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The AttenV1_Bm15_K05 factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 240
CppName: "FI_ALICE_MUSIC_ALBUM_TITLE_ANNOTATION_MAX_VALUE_WEIGHTED"
Name: "AliceMusicAlbumTitleAnnotationMaxValueWeighted"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The AnnotationMaxValueWeighted factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 241
CppName: "FI_IS_FOREIGN_QUERY"
Name: "IsForeignQuery"
DependsOn: [{Feature: ["IsForeignQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The query is not in Russian"
Authors: "denplusplus"
Responsibles: "alsafr"
UseArtifact: {Name: "QueryLang"}
}
Factor {
Index: 242
CppName: "FI_IS_FOREIGN_CLUSTER"
Name: "IsForeignCluster"
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "The document is from a foreign cluster"
Responsibles: "alsafr"
}
Factor {
Index: 243
CppName: "FI_PAGE_REGION_SIZE_IN"
Name: "PageRegionSizeIn"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: "The size of the page region"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 244
CppName: "FI_PAGE_REGION_INV_SIZE_IN"
Name: "PageRegionInvSizeIn"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: "The factor is inversely proportional to the size of the page region"
Authors: "denplusplus"
Responsibles: "alsafr"
CanonicalValue: 1.0
}
Factor {
Index: 245
CppName: "FI_QUERY_REGION_SIZE"
Name: "QueryRegionSize"
Group: "Query"
Tags: [TG_DYNAMIC, TG_LOCALIZED_CITY, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The size of the query region"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 246
CppName: "FI_QUERY_REGION_INV_SIZE"
Name: "QueryRegionInvSize"
Group: "Query"
Tags: [TG_DYNAMIC, TG_LOCALIZED_CITY, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor is inversely proportional to the size of the query region"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 247
CppName: "FI_GEO_GEOMETRY_PROXIM"
Name: "GeoGeometryProxim"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: "Geographical closeness of the user and the website"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 248
CppName: "FI_RINGS_HOST_RANK_BADNESS_OLD"
Name: "RingsHostRankBadnessOld"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=181r#h58953-4>"
Tags: [TG_OWNER, TG_STATIC, TG_DEPRECATED]
Description: "It characterizes the level of growth of the website by link circles. The value is the share of external links that are included in link circles and link exchanges."
Authors: ["denplusplus", "raigorodsky"]
Responsibles: ["raigorodsky", "alsafr"]
}
Factor {
Index: 249
CppName: "FI_YABAR_HOST_VISITORS"
Name: "YabarHostVisitors"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The number of unique visitors, which is remapped exponentially"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 250
CppName: "FI_YABAR_HOST_SEARCH_TRAFFIC"
Name: "YabarHostSearchTraffic"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The percentage of traffic from the search engines"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 251
CppName: "FI_YABAR_HOST_INTERNAL_TRAFFIC"
Name: "YabarHostInternalTraffic"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The percentage of website visits that did not come via links (only direct traffic or visits from bookmarks)"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 252
CppName: "FI_YABAR_HOST_AVG_TIME"
Name: "YabarHostAvgTime"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_REARR_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The average (among users) active continuous time (in seconds) spent by a user on host pages"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 253
CppName: "FI_YABAR_HOST_AVG_TIME2"
Name: "YabarHostAvgTime2"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_REARR_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The average (among users) active continuous time (in seconds) spent by a user on host pages. According to the internal counter of Yandex.Bar/Elements/Browser"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 254
CppName: "FI_YABAR_HOST_AVG_ACTIONS"
Name: "YabarHostAvgActions"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The average number (among users) of active actions (clicks, keystrokes) when the user is continuously (in seconds) on the host pages."
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 255
CppName: "FI_YABAR_HOST_BROWSE_RANK"
Name: "YabarHostBrowseRank"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_BROWSER_PAGE_RANK, TG_USERFEAT]
Description: "The implementation of the algorithm described in the article ((<http://wiki.yandex-team.ru//h.yandex.net/?http%3A%2F%2Fresearch.microsoft.com%2Fen-us%2Fpeople%2Ftyliu%2Ffp032-liu.pdf> <http://research.microsoft.com/en-us/people/tyliu/fp032-liu.pdf>))"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 256
CppName: "FI_YABAR_URL_VISITS"
Name: "YabarUrlVisits"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "URL traffic based on Yandex.Bar"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 257
CppName: "FI_YABAR_URL_VISITORS"
Name: "YabarUrlVisitors"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The number of URL's unique visitors"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 258
CppName: "FI_YABAR_URL_AVG_TIME"
Name: "YabarUrlAvgTime"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The average time (among users) a user spends on a page. It is calculated as the difference between close visits."
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 259
CppName: "FI_OWNER_SATISFIED4_RATE"
Name: "OwnerSatisfied4Rate"
Ticket: "BUKI-955"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/OwnerSatisfied4Rate>"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "This is the SEA factor = s4_r/ (k_r+10) where s4_r - is a number of clicks > 180 sec, k_r - the total number of clicks."
Authors: ["popescul", "cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 260
CppName: "FI_OWNER_SATISFIED4_RATE_REG"
Name: "OwnerSatisfied4Rate_Reg"
Ticket: "BUKI-955"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/OwnerSatisfied4Rate>"
Group: "RegHostStatic"
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "This is the SEA factor = s4_r/ (k_r+10) where s4_r - is a number of clicks > 180 sec, k_r - the total number of clicks. A localized version"
Authors: ["popescul", "cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 261
CppName: "FI_URL_QUERY_VARIETY"
Name: "UrlQueryVariety"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "How varied the queries are that led visitors to click on the URL in the SERP"
Wiki: "<https://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Kliki#urlqueryvarietyreg>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 262
CppName: "FI_IS_COMM_BY_KEYWORDS"
Name: "IsCommByKeywords"
Tags: [TG_STATIC, TG_DEPRECATED]
Description: "The page is commercial by keywords. It is not being used (deprecated)"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 263
CppName: "FI_DOC_TFIDF_SUM"
Name: "DocIdfSum_broken"
Tags: [TG_STATIC, TG_DEPRECATED, TG_L2]
Description: "Idf on various document parts, broken and not being used"
Authors: "melton"
Responsibles: "melton"
}
Factor {
Index: 264
CppName: "FI_TITLE_IDF_SUM"
Name: "TitleIdfSum_broken"
Tags: [TG_STATIC, TG_DEPRECATED, TG_L2]
Description: "Idf on various document parts, broken and not being used"
Authors: "melton"
Responsibles: "melton"
}
Factor {
Index: 265
CppName: "FI_HEADING_IDF_SUM"
Name: "HeadingIdfSum_broken"
Tags: [TG_STATIC, TG_DEPRECATED, TG_L2]
Description: "Idf on various document parts, broken and not being used"
Authors: "melton"
Responsibles: "melton"
}
Factor {
Index: 266
CppName: "FI_NORMAL_TEXT_IDF_SUM"
Name: "NormalTextIdfSum_broken"
Tags: [TG_STATIC, TG_DEPRECATED, TG_L2]
Description: "Idf on various document parts, broken and not being used"
Authors: "melton"
Responsibles: "melton"
}
Factor {
Index: 267
CppName: "FI_LR_VIDEO_RELEV"
Name: "XLRVideoRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "A link factor based on the video presence on the page."
Authors: "vnik"
Responsibles: "vnik"
}
Factor {
Index: 268
CppName: "FI_AUX_TEXT_BM25"
Name: "AuxTextBM25"
AntiSeoUpperBound: 0.8
Group: "AuxBM25"
Tags: [TG_DOC_TEXT, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "BM25 by user's region for localizable queries; and the country for non-localizable queries in KUB. The texts of sent queries for regions can be viewed in relev_regions.txt in the Sorcerer (algorithm name)"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 269
CppName: "FI_AUX_LINK_BM25"
Name: "AuxLinkBM25"
AntiSeoUpperBound: 0.8
Group: "AuxBM25"
Tags: [TG_DYNAMIC, TG_LOCALIZED_CITY, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "It's the same for link relevance"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 270
CppName: "FI_COMM_LINKS_SEO_HOSTS"
Name: "CommLinksSEOHosts"
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "Percentage of links that were bought. The algorithm for recognizing links that were bought has been implemented. The factor is remapped to [0,1] if the share of such links is > 50%, otherwise it's 0. ((<http://wiki.yandex-team.ru/SvetlanaShorina/topseolinks> a selection of boosted websites))"
Authors: "kvn"
Responsibles: "sisoid"
}
Factor {
Index: 271
CppName: "FI_COMM_LINKS_SEO_HOSTS_PORNO_QUERY"
Name: "CommLinksSEOHostsPornoQuery"
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_LINK_GRAPH, TG_OWNER, TG_DYNAMIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: "The previous factor multiplied by PornoQuery"
Authors: "kvn"
Responsibles: "sisoid"
}
Factor {
Index: 272
CppName: "FI_COMM_LINKS_SEO_HOSTS_NON_COMM"
Name: "CommLinksSEOHostsNonComm"
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_LINK_GRAPH, TG_OWNER, TG_DYNAMIC, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The CommLinksSEOHosts factor multiplied by NonCommercialQuery"
Authors: "kvn"
Responsibles: "sisoid"
}
Factor {
Index: 273
CppName: "FI_TOVAR_CATEGORY_QUERY"
Name: "TovarCategoryQuery"
DependsOn: [{Feature: ["TovarCategoryQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: "The query mentions a product category. It’s not being used (deprecated)"
Responsibles: "alsafr"
}
Factor {
Index: 274
CppName: "FI_TOVAR_VENDOR_QUERY"
Name: "TovarCategoryVendor"
DependsOn: [{Feature: ["TovarCategoryVendor"], Slice: "begemot_query_factors"}]
Group: "Query"
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: "The query mentions a vendor. It is not being used (deprecated)"
Responsibles: "alsafr"
}
Factor {
Index: 275
CppName: "FI_Q_DIVERSITY2"
Name: "Diversity2"
DependsOn: [{Feature: ["Diversity2"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Description: "The geographic distribution of the query"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Diversity2>"
Authors: "denplusplus"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 276
CppName: "FI_NIGHT_QUERY"
Name: "NightQuery"
DependsOn: [{Feature: ["NightQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The query is used mainly at night"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 277
CppName: "FI_MORNING_QUERY"
Name: "MorningQuery"
DependsOn: [{Feature: ["MorningQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The query is used mainly in the morning"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 278
CppName: "FI_DAY_QUERY"
Name: "DayQuery"
DependsOn: [{Feature: ["DayQuery"], Slice: "begemot_query_factors"}]
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_REARR_USE, TG_L2, TG_DEPRECATED]
Group: "Query"
Description: "The query is used mainly in the afternoon"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 279
CppName: "FI_EVENING_QUERY"
Name: "EveningQuery"
DependsOn: [{Feature: ["EveningQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The query is used mainly in the evening"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 280
CppName: "FI_HOUR_DIVERSITY"
Name: "HourDiversity"
DependsOn: [{Feature: ["HourDiversity"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Description: "How varied the times of day are at which the query is used"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity>"
Authors: "denplusplus"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 281
CppName: "FI_LCOR"
Name: "LCor"
Group: "Dynamic"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "It measures the frequency of words in links. The factor is more important if the word that played in the link relevance is rare for links."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 282
CppName: "FI_SUBQUERY_THEME_MATCH_A"
Name: "SubqueryThMatchA"
Tags: [TG_DOC, TG_DYNAMIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The topic of the query and the document are matching. The topic of the query is the work result. ((<http://wiki.yandex-team.ru/EvgenijjKroxalev/subquery> the sorcerer’s (algorithms name) rules SubquerySearch )) The topic of the document is determined by an automatic classifier"
Authors: ["ekrokhalev", "pyal"]
Responsibles: ["pyal", "lamo"]
}
Factor {
Index: 283
CppName: "FI_TR_DOCQUORUM"
Name: "TRDocQuorum"
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The weight of query words that are present in the text"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 284
CppName: "FI_LR_DOCQUORUM"
Name: "LRDocQuorum"
Group: "Dynamic"
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_UNUSED, TG_DEPRECATED]
Description: "The weight of query words that are present in the links"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 285
CppName: "FI_TRLR_DOCQUORUM"
Name: "TRLRDocQuorum"
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The weight of query words that are present in the text and links"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 286
CppName: "FI_OWNER_SDIFF_CLICK_ENTROPY"
Name: "OwnerSDiffClickEntropy"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The entropy - the distribution of clicks"
Wiki: "<http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick>"
Authors: ["cliff", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 287
CppName: "FI_OWNER_SDIFF_SHOW_ENTROPY"
Name: "OwnerSDiffShowEntropy"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The entropy - the distribution of impressions"
Wiki: "<http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick>"
Authors: ["cliff", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 288
CppName: "FI_OWNER_SDIFF_CSRATIO_ENTROPY"
Name: "OwnerSDiffCSRatioEntropy"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The entropy - the ratio between clicks and impressions"
Wiki: "<http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick>"
Authors: ["cliff", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 289
CppName: "FI_PORNO_LR_LOG_RELEV"
Name: "XPornoLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "A porn document based on the text of the links"
Authors: "somov"
Responsibles: "somov"
}
Factor {
Index: 290
CppName: "FI_PORNO_NORM_LR_LOG_RELEV"
Name: "XPornoNormLRlogRelev"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "A porn document based on the text of the links, another normalization"
Responsibles: "alsafr"
}
Factor {
Index: 291
CppName: "FI_XPORNO_QUERY"
Name: "XPornoQuery"
DependsOn: [{Feature: ["XPornoQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The classifier of porn queries, another dictionary that differs from PornoQuery"
Responsibles: "alsafr"
UseArtifact: {Name: "PornoQueryList"}
}
Factor {
Index: 292
CppName: "FI_ALICE_MUSIC_ALBUM_TITLE_ATTENV1_BM15_K05"
Name: "AliceMusicAlbumTitleAttenV1_Bm15_K05"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The AttenV1_Bm15_K05 factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 293
CppName: "FI_GEO_COUNTRY_COUNTRY_PROXIM"
Name: "GeoCountryCountryProxim"
Tags: [TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_HOST, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The geographic closeness of the website country and the query country"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 294
CppName: "FI_URL_DOMAIN_FRACTION"
Name: "UrlDomainFraction"
Group: "Dynamic"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlTrigramFraction>"
Tags: [TG_HOST, TG_DYNAMIC, TG_URL_TEXT, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: "Domain coverage with the three letters from the query. (Chelyabinsk lottery is chelloto. We convert the query using transliteration, find the three letters that are covered (che, hel, lot, olo), and check what part of all the three-letter combos is covered)"
Authors: ["cliff", "melton"]
Responsibles: ["tsimkha", "melton"]
}
Factor {
Index: 295
CppName: "FI_URL_PATH_AND_PARAMS_FRACTION"
Name: "UrlPathAndParamsFraction"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlTrigramFraction>"
Tags: [TG_DOC, TG_DYNAMIC, TG_URL_TEXT, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: "It’s the same as the previous factor but it’s about the whole URL except for the domain"
Responsibles: ["tsimkha", "alsafr"]
}
Factor {
Index: 296
CppName: "FI_SPECIFICAL_QUERY"
Name: "SpecificalQuery"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The query is locally specific. The query is often reformulated with an explicit region specification. ((<https://ml.yandex-team.ru/archive/thread1433892/#message1433892> in more detail))"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 297
CppName: "FI_JOKER_LEN"
Name: "JokerLen"
Ticket: "BUKI-705"
Group: "CombinedSequences"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: "We count text features, assuming that the title of the page is assigned to each of its sentences, i.e. the distance between the word from the title and any other word is 1 sentence. Len is the maximum ratio of words from the query found in some sentence of the text (with the assigned title) in relation to the length of the query. This is the example [Harms circus Vertunov] for ((<http://wiki.yandex-team.ru//h.yandex.net/?http%3A%2F%2Fwww.wikilivres.info%2Fwiki%2F%25D0%25A6%25D0%25B8%25D1%2580%25D0%25BA_%25D0%25A8%25D0%25B0%25D1%2580%25D0%25B4%25D0%25B0%25D0%25BC_%28%25D0%25A5%25D0%25B0%25D1%2580%25D0%25BC%25D1%2581%29> of this document))"
Authors: "styskin"
Responsibles: "styskin"
}
Factor {
Index: 298
CppName: "FI_JOKER_WEIGHT"
Name: "JokerWeight"
Group: "CombinedSequences"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: "The ratio of the idf sum of the words encountered in the sentence + title for all words."
Responsibles: "alsafr"
}
Factor {
Index: 299
CppName: "FI_EXACT_JOKER_LEN"
Name: "ExactJokerLen"
Group: "CombinedSequences"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: "It’s the same as JokerLen, based on exact forms"
Responsibles: "alsafr"
}
Factor {
Index: 300
CppName: "FI_EXACT_JOKER_WEIGHT"
Name: "ExactJokerWeight"
Group: "CombinedSequences"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: "It’s the same as JokerWeight, based on exact forms"
Responsibles: "alsafr"
}
Factor {
Index: 301
CppName: "FI_MORE_120_SEC_VISITS_NOT_SEARCH_SHARE"
Name: "More120SecVisitsNotSearchShare"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: "Remapped mascot feature More120SecVisitsNotSearchShare"
Ticket: "SEARCHSPAM-15531"
Authors: ["bikulov"]
Responsibles: ["bikulov", "sdormidontov"]
ImplementationTime: "2020-09-30"
}
Factor {
Index: 302
CppName: "FI_LINK_BREAK"
Name: "LnkBreak"
Group: "LinkBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The analogues of the corresponding text factors for links. BM25 of the number of matched links."
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 303
CppName: "FI_LINK_BM25_EX"
Name: "LnkBm25Ex"
Group: ["LinkBM25", "Dynamic"]
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "A simple BM25 based on the exact form in link texts"
Responsibles: "alsafr"
}
Factor {
Index: 304
CppName: "FI_LINK_PAIR_SYN"
Name: "LnkPairSy"
Group: "LinkBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The presence of pairs of words in links including synonyms"
Responsibles: "alsafr"
}
Factor {
Index: 305
CppName: "FI_LINK_BREAK_SYN"
Name: "LnkBrkSy"
Group: "LinkBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The number of links that passed the limit"
Responsibles: "alsafr"
}
Factor {
Index: 306
CppName: "FI_LINK_BM25_SYN"
Name: "LnkBm25Sy"
Group: ["LinkBM25", "Dynamic"]
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "A simple BM25 on links including synonyms"
Responsibles: "alsafr"
}
Factor {
Index: 307
CppName: "FI_IS_VIDEO_QUERY"
Name: "VideoQuery"
DependsOn: [{Feature: ["VideoQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "A video query"
Responsibles: "alsafr"
}
Factor {
Index: 308
CppName: "FI_OWNER_CLICKS_PCTR_REG"
Name: "OwnerClicksPCTR_Reg"
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Group: "RegHostStatic"
Description: "The clickability of the owner regardless of the request, independently by region"
Wiki: "<http://wiki.yandex-team.ru/ЯндексПоиск/КачествоПоиска/Клики#ownerclickspctrreg>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 309
CppName: "FI_OWNER_SDIFF_CLICK_ENTROPY_REG"
Name: "OwnerSDiffClickEntropy_Reg"
Group: "RegHostStatic"
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The entropy - the distribution of clicks. It is regionalized"
Wiki: "<http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 310
CppName: "FI_OWNER_SDIFF_SHOW_ENTROPY_REG"
Name: "OwnerSDiffShowEntropy_Reg"
Group: "RegHostStatic"
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The entropy - the distribution of impressions. It is regionalized"
Wiki: "<http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 311
CppName: "FI_OWNER_SDIFF_CSRATIO_ENTROPY_REG"
Name: "OwnerSDiffCSRatioEntropy_Reg"
Group: "RegHostStatic"
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The entropy - the distribution of the click/impressions ratio. It is regionalized"
Wiki: "<http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 312
CppName: "FI_ADULTNESS"
Name: "Adultness"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: "equals 2 * NastyContent"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Adultness>"
Authors: "melton"
Responsibles: "snow"
}
Factor {
Index: 313
CppName: "FI_HOST_ADULTNESS"
Name: "HostAdultness"
Tags: [TG_HOST, TG_STATIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: "equals 2 * NastyContent"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HostAdultness>"
Responsibles: "snow"
}
Factor {
Index: 314
CppName: "FI_KC_HOST_ADULTNESS"
Name: "KCHostAdultness"
Tags: [TG_HOST, TG_STATIC, TG_THEME_CLASSIF, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "always zero"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/KCHostAdultness>"
Responsibles: "snow"
}
Factor {
Index: 315
CppName: "FI_IS_COM"
Name: "IsCom"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/DomainZone>"
Tags: [TG_HOST, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The domain is in the .com zone"
Authors: "somov"
Responsibles: ["tsimkha", "alsafr"]
}
Factor {
Index: 316
CppName: "FI_IS_UA"
Name: "IsUa"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/DomainZone>"
Tags: [TG_HOST, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The domain is in the .ua zone"
Authors: "somov"
Responsibles: ["tsimkha", "alsafr"]
}
Factor {
Index: 317
CppName: "FI_IS_NOT_RU"
Name: "IsNotRu"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/DomainZone>"
Tags: [TG_HOST, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The domain is not in the .ru zone"
Authors: "somov"
Responsibles: ["tsimkha", "alsafr"]
}
Factor {
Index: 318
CppName: "FI_LR_MARKET_RELEV"
Name: "XLRMarketRelev"
AntiSeoUpperBound: 1.0
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "LR based on links from Yandex.Market"
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 319
CppName: "FI_POETRY"
Name: "Poetry"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-18>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The poetry level of the document"
Authors: "vnik"
Responsibles: "vnik"
}
Factor {
Index: 320
CppName: "FI_POETRY_QUAD"
Name: "PoetryQuad"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-18>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The maximum poetry level of the quatrain"
Authors: "vnik"
Responsibles: "vnik"
}
Factor {
Index: 321
CppName: "FI_ENG_LANG"
Name: "EngLang"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document language is English"
Responsibles: "alsafr"
}
Factor {
Index: 322
CppName: "FI_DOC_HAS_TWO_EXACT_QUERY_PARTS"
Name: "Has2ExactQueryParts"
Group: "ExactGroups"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The query is completely covered by the two exact groups consisting of the exact match query words in a row ((<http://wiki.yandex-team.ru/poiskovajaplatforma/tr/CoverageByGroups> About the coverage by the groups))"
Authors: ["finder", "gruntova"]
Responsibles: "finder"
}
Factor {
Index: 323
CppName: "FI_DOC_HAS_LEVENSHT1_QUERY_FRAGMENT"
Name: "HasLevensht1QueryFragment"
Group: "ExactGroups"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "There is a group which consists of the exact match query words, covering the query (possibly with omission, addition, or replacement of the word)"
Authors: ["finder", "gruntova"]
Responsibles: "finder"
}
Factor {
Index: 324
CppName: "FI_LARGEST_SY_INEXACT_GROUP"
Name: "LargestSyInexactGroup"
Group: "ExactGroups"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of the query covered by the longest group which consists of any hits (including word forms and synonyms). Possibly with an omission, addition, or replacement of a word"
Authors: ["finder", "gruntova"]
Responsibles: "finder"
}
Factor {
Index: 325
CppName: "FI_TIME_PROFILES_MATCH_WD"
Name: "TimeProfilesMatchWD"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "It describes the proximity of time profiles of the query and documents on working days"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/TimeProfilesMatch>"
Authors: "akorsun"
Responsibles: "alsafr"
}
Factor {
Index: 326
CppName: "FI_TIME_PROFILES_MATCH_WE"
Name: "TimeProfilesMatchWE"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "It describes the proximity of time profiles of the query and documents on weekends"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/TimeProfilesMatch>"
Authors: "akorsun"
Responsibles: "alsafr"
}
Factor {
Index: 327
CppName: "FI_CYR_LANG"
Name: "CyrLang"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/CyrLang>"
AntiSeoUpperBound: 1.0
Tags: [TG_BINARY, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document language is Cyrillic"
Responsibles: "pavelgur"
}
Factor {
Index: 328
CppName: "FI_REGIONAL_U_QUERY"
Name: "GeoRegionalityU"
DependsOn: [{Feature: ["GeoRegionalityU"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_L2]
Description: "The query factors are the output of ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoRegionality> the query geolocalization classifier)). U - geo-useless - the regional query results are meaningless"
Responsibles: "esoloviev"
}
Factor {
Index: 329
CppName: "FI_REGIONAL_R_QUERY"
Name: "GeoRegionalityR"
DependsOn: [{Feature: ["GeoRegionalityR"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_L2]
Description: "R- geo-relevant - the regional query results could be useful, but it’s nothing more than that"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 330
CppName: "FI_REGIONAL_V_QUERY"
Name: "GeoRegionalityV"
DependsOn: [{Feature: ["GeoRegionalityV"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_L2]
Description: "V- geo-vital - the regional SERP is essential"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 331
CppName: "FI_URL_HAS_NO_DIGITS"
Name: "UrlHasNoDigits"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The URL does not contain numbers"
Authors: "melton"
Responsibles: "melton"
}
Factor {
Index: 332
CppName: "FI_ALICE_MUSIC_TRACK_ARTIST_NAMES_ALL_WCM_MAX_MATCH"
Name: "AliceMusicTrackArtistNamesAllWcmMaxMatch"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The AllWcmMaxMatch factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 333
CppName: "FI_ALICE_MUSIC_TRACK_ALBUM_TITLE_COSINE_MATCH_MAX_PREDICTION"
Name: "AliceMusicTrackAlbumTitleCosineMatchMaxPrediction"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The CosineMatchMaxPrediction factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 334
CppName: "FI_SYN_S1"
Name: "SynS1"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "They show how unnatural the text is in terms of Russian language grammar. It’s the evaluation of how much the document text can be considered as generated by a synonymizer or even automatically. ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=1il#h58953-2> in more detail))"
Authors: "grechnik"
Responsibles: "grechnik"
}
Factor {
Index: 335
CppName: "FI_SYN_FL_REMAP1"
Name: "SynFLremap1"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "They show how unnatural the text is in terms of Russian language grammar. It’s the evaluation of how much the document text can be considered as generated by a synonymizer or even automatically. ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=1il#h58953-2> in more detail))"
Authors: "grechnik"
Responsibles: "grechnik"
}
Factor {
Index: 336
CppName: "FI_SYN_FL_REMAP2"
Name: "SynFLremap2"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "They show how unnatural the text is in terms of Russian language grammar. It’s the evaluation of how much the document text can be considered as generated by a synonymizer or even automatically. ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=1il#h58953-2> in more detail))"
Authors: "grechnik"
Responsibles: "grechnik"
}
Factor {
Index: 337
CppName: "FI_OWNER_SESS_NORM_DUR"
Name: "OwnerSessNormDuration"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "nd/k The normalized time before the click"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 338
CppName: "FI_URL_SESS_NORM_DUR_RATE"
Name: "UrlSessNormDurRate"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "nd/i"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 339
CppName: "FI_QUERY_DOWNER_SESS_NORM_DUR"
Name: "QueryDOwnerSessNormDuration"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "nd/k"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 340
CppName: "FI_QUERY_DOWNER_WEIGHT_CLICK"
Name: "QueryDOwnerWeightClick"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "w/k"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 341
CppName: "FI_QUERY_DOWNER_ONLY_CLICK_RATE"
Name: "QueryDOwnerOnlyClickRate"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "o/i"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 342
CppName: "FI_QUERY_DOWNER_CLICK_SUMMARY"
Name: "QueryDOwnerClickSummary"
Ticket: "BUKI-955"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The selected formula"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["akhropov", "angshu", "cliff", "popescul"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 343
CppName: "FI_QUERY_DOWNER_SATISFIED4_RATE"
Name: "QueryDOwnerSatisfied4Rate"
Ticket: "BUKI-955"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "r_s4b/(r_k + 10)"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["akhropov", "angshu", "cliff", "popescul"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 344
CppName: "FI_SYNT_QUALITY"
Name: "SyntQuality"
Wiki: "<http://wiki.yandex-team.ru/PoiskovajaPlatforma/Lingvistika/SyntaxInQueries/SyntFactors/IsSynt>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Does the query contain a full sentence analysis?"
Authors: "zador"
Responsibles: "zador"
}
Factor {
Index: 345
CppName: "FI_PAGE_DATE"
Name: "PageDate"
Group: "Datetime"
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document date that is written on the page is remapped with a square root"
Responsibles: "alsafr"
}
Factor {
Index: 346
CppName: "FI_VISITS_P_VISITORS"
Name: "VisitsPVisitors"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: "Remapped mascot feature VisitsPVisitors"
Ticket: "SEARCHSPAM-15531"
Authors: ["bikulov"]
Responsibles: ["bikulov", "sdormidontov"]
ImplementationTime: "2020-09-30"
}
Factor {
Index: 347
CppName: "FI_RINGS_HOST_RANK_BADNESS_2"
Name: "RingsHostRankBadness2"
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_BINARY, TG_DEPRECATED]
Description: "The additional factors about the website growth thanks to link circles, ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=181r#h58953-4> in more detail))"
Authors: ["denplusplus", "raigorodsky"]
Responsibles: ["raigorodsky", "alsafr"]
}
Factor {
Index: 348
CppName: "FI_RINGS_HOST_RANK_BADNESS_3"
Name: "RingsHostRankBadness3"
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED]
Description: "The additional factors about the website growth thanks to link circles, ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=181r#h58953-4> in more detail))"
Authors: ["denplusplus", "raigorodsky"]
Responsibles: ["raigorodsky", "alsafr"]
}
Factor {
Index: 349
CppName: "FI_RINGS_HOST_RANK_BADNESS_4"
Name: "RingsHostRankBadness4"
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_BINARY, TG_DEPRECATED]
Description: "The additional factors about the website growth thanks to link circles, ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=181r#h58953-4> in more detail))"
Authors: ["denplusplus", "raigorodsky"]
Responsibles: ["raigorodsky", "alsafr"]
}
Factor {
Index: 350
CppName: "FI_HAS_TEXT_POS"
Name: "HasTextPos"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HasTextPos>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document has text relevance"
Authors: "denplusplus"
Responsibles: ["alsafr", "stash93"]
}
Factor {
Index: 351
CppName: "FI_QSEGMENTS_BM25"
Name: "QSegmentsBM25"
Group: "QSegments"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "BM25, where 'words' are the selected query segments"
Responsibles: "alsafr"
}
Factor {
Index: 352
CppName: "FI_QSEGMENTS_WEIGHT"
Name: "QSegmentsWeight"
Group: "QSegments"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The weight of query segments in the text"
Responsibles: "alsafr"
}
Factor {
Index: 353
CppName: "FI_SYN_BAD_WORD_PAIRS"
Name: "SynPercentBadWordPairs"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=186j#h58953-3>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The indicator of the unnaturalness in terms of Russian language grammar. The number of bad pairs of words in the text, renormalized to the segment [0,1] according to the formula z/(z+10)"
Responsibles: "alsafr"
}
Factor {
Index: 354
CppName: "FI_SYN_NUM_BAD_WORD_PAIRS"
Name: "SynNumBadWordPairs"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=186j#h58953-3>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of bad pairs among all those found in the table: z/(x+1), where z is the number of bad pairs in the text, and x is the number of ((<http://wiki.yandex-team.ru/EvgenijjGrechnikov/TestSynonimizers> 2000-relevant)) pairs"
Responsibles: "alsafr"
}
Factor {
Index: 355
CppName: "FI_NUM_LATIN_LETTERS"
Name: "NumLatinLetters"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of Latin letters in the text (excluding commas, hyphens and other punctuation), mapped to [0,1] by the formula n/(n+100)"
Authors: "grechnik"
Responsibles: "grechnik"
}
Factor {
Index: 356
CppName: "FI_RINGS_HOST_RANK_BADNESS_1"
Name: "RingsHostRankBadness1"
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED]
Description: "The additional factors about the website growth thanks to link circles, ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=181r#h58953-4> in more detail))"
Authors: ["denplusplus", "raigorodsky"]
Responsibles: ["raigorodsky", "alsafr"]
}
Factor {
Index: 357
CppName: "FI_DOC_TFIDF_SUM_FIXED"
Name: "DocIdfSumFixed"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The previous factors have been fixed"
Responsibles: "alsafr"
}
Factor {
Index: 358
CppName: "FI_TITLE_IDF_SUM_FIXED"
Name: "TitleIdfSumFixed"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The previous factors have been fixed"
Responsibles: "alsafr"
}
Factor {
Index: 359
CppName: "FI_HEADING_IDF_SUM_FIXED"
Name: "HeadingIdfSumFixed"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The previous factors have been fixed"
Responsibles: "alsafr"
}
Factor {
Index: 360
CppName: "FI_NORMAL_TEXT_IDF_SUM_FIXED"
Name: "NormalTextIdfSumFixed"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The previous factors have been fixed"
Responsibles: "alsafr"
}
Factor {
Index: 361
CppName: "FI_QUERY_URL_CLICKS_COMBO"
Name: "QueryURLClicksCombo"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The factor that consists of FRC and pseudo-CTR"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: ["lidia", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 362
CppName: "FI_QUERY_DOWNER_CLICKS_COMBO"
Name: "QueryDOwnerClicksCombo"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The factor that consists of FRC and pseudo-CTR"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Клики#queryurldownerclickspctrfrccomboreg>"
Authors: ["lidia", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 363
CppName: "FI_LR_AMORTIZED_BY_AGE"
Name: "LRAmortizedByAge"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Link relevance with pessimization of older links"
Authors: "dremov"
Responsibles: "dremov"
}
Factor {
Index: 364
CppName: "FI_WORDS_IN_TEXT"
Name: "RusWordsInText"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of words in the text (a word is whatever the lemmer has identified as one), mapped to [0,1] by the formula x/(x+A)"
Authors: "grechnik"
Responsibles: "grechnik"
}
Factor {
Index: 365
CppName: "FI_WORDS_IN_TITLE"
Name: "RusWordsInTitle"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of Russian words in the heading"
Responsibles: "alsafr"
}
Factor {
Index: 366
CppName: "FI_MEAN_WORD_LENGTH"
Name: "MeanWordLength"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The average word length"
Responsibles: "alsafr"
}
Factor {
Index: 367
CppName: "FI_PERCENT_WORDS_IN_LINKS"
Name: "PercentWordsInLinks"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of the number of words inside the <a>..</a> tag from the number of all words"
Responsibles: "alsafr"
}
Factor {
Index: 368
CppName: "FI_PERCENT_VISIBLE_CONTENT"
Name: "PercentVisibleContent"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of the number of words outside the tags (outside the brackets <>) from the number of all words"
Responsibles: "alsafr"
}
Factor {
Index: 369
CppName: "FI_PERCENT_FREQ_WORDS"
Name: "PercentFreqWords"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of the number of words that are the 200 most frequent words of the language, from the number of all words in the text"
Responsibles: "alsafr"
}
Factor {
Index: 370
CppName: "FI_PERCENT_USED_FREQ_WORDS"
Name: "PercentUsedFreqWords"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of the 500 most popular words of the language used in the text, divided by 500"
Responsibles: "alsafr"
}
Factor {
Index: 371
CppName: "FI_TRIGRAMS_PROB"
Name: "TrigramsProb"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The logarithm of the geometric mean of the probabilities of trigrams in the text (the probability of a trigram is the number of its occurrences in the text divided by the number of all trigrams), mapped to [0,1] using the formula -x(x+A)"
Responsibles: "alsafr"
}
Factor {
Index: 372
CppName: "FI_TRIGRAMS_COND_PROB"
Name: "TrigramsCondProb"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The logarithm of the geometric mean of the conditional probabilities of trigrams. The conditional probability of a trigram is its probability divided by the probability of the bigram formed by its first two words"
Responsibles: "alsafr"
}
Factor {
Index: 373
CppName: "FI_DOPP_DOWNER_PCTR"
Name: "DoppDOwnerPCTR"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The QueryDOwnerClicksPCTR factor analogue, which differs from QueryDOwnerClicksPCTR because the queries are normalized by doppelgangers (for the details of such normalization, ask ((<http://staff.yandex-team.ru/finder> Andrey Plakhov)); code - ysite/yandex/doppelgangers)"
Authors: "finder"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 374
CppName: "FI_DOPP_DOWNER_PCTR_REG"
Name: "DoppDOwnerPCTR_Reg"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The QueryDOwnerClicksPCTR factor analogue, which differs from QueryDOwnerClicksPCTR because the queries are normalized by doppelgangers (for the details of such normalization, ask ((<http://staff.yandex-team.ru/finder> Andrey Plakhov)); code - ysite/yandex/doppelgangers). Localized to relev_regions.web.txt"
Authors: "finder"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 375
CppName: "FI_DOPP_URL_PCTR"
Name: "DoppUrlPCTR"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The QueryUrlClicksPCTR factor analogue, which differs from QueryUrlClicksPCTR because the queries are normalized by doppelgangers (for the details of such normalization, ask ((<http://staff.yandex-team.ru/finder> Andrey Plakhov)); code - ysite/yandex/doppelgangers)"
Authors: "finder"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 376
CppName: "FI_DOPP_URL_PCTR_REG"
Name: "DoppUrlPCTR_Reg"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The QueryUrlClicksPCTR factor analogue, which differs from it because the queries are normalized by doppelgangers (for the details of such normalization, ask ((<http://staff.yandex-team.ru/finder> Andrey Plakhov)); code - ysite/yandex/doppelgangers). Localized to relev_regions.web.txt"
Authors: "finder"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 377
CppName: "FI_URL_BM25"
Name: "UrlBM25"
AntiSeoUpperBound: 1.0
Wiki: "<http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/URLMatch>"
Group: "UrlBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "BM25 based on URL"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 378
CppName: "FI_HAS_BIG_PICTURE"
Name: "HasBigPicture"
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The page contains a large image"
Responsibles: "alsafr"
}
Factor {
Index: 379
CppName: "FI_MATRIXNET"
Name: "MatrixNet"
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_NOT_01, TG_REARR_USE, TG_UNUSED, TG_L3_MODEL_VALUE]
Description: "The MatrixNet formula is applied to all factors (TG_UNUSED - to prevent entry into any formulas)"
Responsibles: "alsafr"
MinValue: -3e+38
MaxValue: 3e+38
}
Factor {
Index: 380
CppName: "FI_DATER_AGE"
Name: "DaterAge"
Group: "Datetime"
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The difference between the current date and the document date that was defined by the dater: 1 - the document date is equal to the current one; 0 - the document is 10 years old or more; and if the date is not defined, it is 0. Attention! ((1 - DaterAge)*60)^2 = page age in days."
Authors: "velavokr"
Responsibles: "velavokr"
}
Factor {
Index: 381
CppName: "FI_HARD_PESSIMIZATION"
Name: "IsHardPessimization"
Tags: [TG_DOC, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "Severe pessimization (aka PR=0); a binary factor that is calculated in antispam"
Authors: "zudina"
Responsibles: "zudina"
}
Factor {
Index: 382
CppName: "FI_C_IN_DEGREE_1"
Name: "CInDegree1"
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: "The host factors that determine the websites boosted with bad links - the second and third incoming degrees ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=181rh58953-4#cindegree12> in more detail))"
Authors: "vakoshelev"
Responsibles: "vakoshelev"
}
Factor {
Index: 383
CppName: "FI_C_IN_DEGREE_2"
Name: "CInDegree2"
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: "The host factors that determine the websites boosted with bad links - the second and third incoming degrees ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=181rh58953-4#cindegree12> in more detail))"
Authors: "vakoshelev"
Responsibles: "vakoshelev"
}
Factor {
Index: 384
CppName: "FI_NUM_NON_RUSSIAN_LINKS"
Name: "NumNonRussianLinks"
Tags: [TG_DOC, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The number of incoming links without Russian letters. Remapping."
Responsibles: "alsafr"
}
Factor {
Index: 385
CppName: "FI_TEXT_MAX_FORMS"
Name: "TextMaxForms"
Group: "TextForms"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The maximum number of forms on all query words - max over all words of the query number_of_forms_for_word/64"
Responsibles: "alsafr"
}
Factor {
Index: 386
CppName: "FI_TEXT_WEIGHTED_FORMS"
Name: "TextWeightedForms"
Group: "TextForms"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The weighted sum of the number of forms based on the weight of words - the sum of all words of the query number_of_forms_for_word/64*weight_of_word; remap of the form x/(1 + x)."
Responsibles: "alsafr"
}
Factor {
Index: 387
CppName: "FI_TEXT_FORMS"
Name: "TextForms"
Group: "TextForms"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The unweighted sum of the number of forms is the sum of all query words of number_of_forms_for_word/64/number_of_query_words"
Responsibles: "alsafr"
}
Factor {
Index: 388
CppName: "FI_LINK_MAX_FORMS"
Name: "LinkMaxForms"
Group: "LinkForms"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "Maximum number of forms across all query words"
Responsibles: "alsafr"
}
Factor {
Index: 389
CppName: "FI_LINK_WEIGHTED_FORMS"
Name: "LinkWeightedForms"
Group: "LinkForms"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "The sum of the number of forms that’s weighted by the word weights"
Responsibles: "alsafr"
}
Factor {
Index: 390
CppName: "FI_LINK_FORMS"
Name: "LinkForms"
Group: "LinkForms"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "Unweighted sum of number of forms"
Responsibles: "alsafr"
}
Factor {
Index: 391
CppName: "FI_TEXT_RELEV_WEIGHTED_1"
Name: "TR_W1"
Group: "LegacyTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The analogues of the factors with the same name, the word weight = 1"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 392
CppName: "FI_LINK_RELEV_WEIGHTED_1"
Name: "XLR_W1"
Group: ["Xref", "Dynamic"]
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The analogues of the factors with the same name, the word weight = 1"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 393
CppName: "FI_TEXT_BM25_FM_WEIGHTED_1"
Name: "TextBM25_Fm_W1"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The analogues of the factors with the same name, the word weight = 1"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 394
CppName: "FI_TEXT_BM25_SYN_WEIGHTED_1"
Name: "TextBM25_Sy_W1"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The analogues of the factors with the same name, the word weight = 1"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 395
CppName: "FI_LINK_BM25_WEIGHTED_1"
Name: "LinkBM25_W1"
Group: "LinkBM25"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The analogues of the factors with the same name, the word weight = 1"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 396
CppName: "FI_TLBM25_WEIGHTED_1"
Name: "TLBM25_W1"
Group: "TextAndLinkBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: "The analogues of the factors with the same name, the word weight = 1"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 397
CppName: "FI_QSEGMENTS_BREAKS"
Name: "QSegmentsBreaks"
Group: "QSegments"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_NN_OVER_FEATURES_USE]
Description: "Query segments are parts of a query that are frequency queries themselves. The factor shows how the segments are broken down in the text. The value 0 means all words occur only within the specified segments, and 1 means all entries break up the segments"
Authors: "solar"
Responsibles: "solar"
}
Factor {
Index: 398
CppName: "FI_ALICE_MUSIC_TRACK_LYRICS_CMMATCH_TOP5_AVG_MATCH"
Name: "AliceMusicTrackLyricsCMMatchTop5AvgMatch"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The CMMatchTop5AvgMatch factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 399
CppName: "FI_NUMERALS_PORTION"
Name: "NumeralsPortion"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of different parts of speech in the text. The percentage of numerals (among all the words in which it was possible to recognize the part of speech)"
Authors: "grechnik"
Responsibles: "grechnik"
}
Factor {
Index: 400
CppName: "FI_PARTICLES_PORTION"
Name: "ParticlesPortion"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of particles"
Responsibles: "alsafr"
}
Factor {
Index: 401
CppName: "FI_ADJ_PRONOUNS_PORTION"
Name: "AdjPronounsPortion"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of pronominal adjectives"
Responsibles: "alsafr"
}
Factor {
Index: 402
CppName: "FI_ADV_PRONOUNS_PORTION"
Name: "AdvPronounsPortion"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of pronominal adverbs"
Responsibles: "alsafr"
}
Factor {
Index: 403
CppName: "FI_VERBS_PORTION"
Name: "VerbsPortion"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of verbs"
Responsibles: "alsafr"
}
Factor {
Index: 404
CppName: "FI_FEM_MAS_NOUNS_PORTION"
Name: "FemAndMasNounsPortion"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of words (among all nouns) that can be both masculine and feminine nouns, but not of neuter gender (examples: 'hummingbird' (rus. kolibri) is an example of an indefinite gender that can be defined in two ways, 'Alexandra' is a homonymy)."
Responsibles: "alsafr"
}
Factor {
Index: 405
CppName: "FI_LINK_QUALITY_FIXED"
Name: "LinkQualityFixed"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: "Quality of incoming links (Leschiner classifier) corrected"
Authors: "somov"
Responsibles: "somov"
}
Factor {
Index: 406
CppName: "FI_HAS_LINK_QUALITY_FIXED"
Name: "HasLinkQualityFixed"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: "Was the LinkQuality calculated for this page or not (it was not if the number of links is low), fixed"
Authors: "somov"
Responsibles: "somov"
}
Factor {
Index: 407
CppName: "FI_NEW_LINK_QUALITY_FIXED"
Name: "NewLinkQualityFixed"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: "The incoming link quality classifier 2, fixed"
Authors: "somov"
Responsibles: "somov"
}
Factor {
Index: 408
CppName: "FI_QUERY_ISORG"
Name: "IsOrg"
DependsOn: [{Feature: ["IsOrg"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The query contains the name of an organization (for instance, Gazprom, Gazproma) ((<http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares> description))"
Authors: "arseny"
Responsibles: "arseny"
}
Factor {
Index: 409
CppName: "FI_ALICE_MUSIC_ARTIST_NAME_CM_MATCH_TOP5_AVG_MATCH_VALUE"
Name: "AliceMusicArtistNameCMMatchTop5AvgMatchValue"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The CMMatchTop5AvgMatchValue factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 410
CppName: "FI_LONGEST_TEXT"
Name: "LongestText"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE]
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/LongText>"
Description: "The size of the largest text segment on the page (from the factor [18] PureText)"
Authors: "denplusplus"
Responsibles: ["tsimkha", "alsafr"]
}
Factor {
Index: 411
CppName: "FI_SMART_UKR"
Name: "SmartUkrainian"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 412
CppName: "FI_SMART_BY"
Name: "SmartBelorussian"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 413
CppName: "FI_LR_WITHOUT_RARE"
Name: "LRWithoutRare"
Group: "LegacyLR"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "Link relevance excluding rare words"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 414
CppName: "FI_DIFFERENT_INTERNAL_LINKS"
Name: "DifferentInternalLinks"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The number of different internal links pointing to this page"
Authors: "somov"
Responsibles: "somov"
}
Factor {
Index: 415
CppName: "FI_HAS_DETERMINED_CITIES"
Name: "HasDeterminedCities"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: "The city is defined for the website"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 416
CppName: "FI_REGIONAL_U_QUERY_NEW"
Name: "GeoRegionalityUNew"
DependsOn: [{Feature: ["GeoRegionalityUNew"], Slice: "begemot_query_factors"}]
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Group: "Query"
Description: "The query factors. The result of work ((<http://wiki.yandex-team.ru/PoiskovajaPlatforma/Lingvistika/ZaprosnyjeFactory/LocalizovannyjeZaprosy> query geolocalization classifier)) - new version of factors [328]-[330]: U - geo-useless - the regional query results are useless;"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 417
CppName: "FI_REGIONAL_R_QUERY_NEW"
Name: "GeoRegionalityRNew"
DependsOn: [{Feature: ["GeoRegionalityRNew"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The query factors. The result of work ((<http://wiki.yandex-team.ru/PoiskovajaPlatforma/Lingvistika/ZaprosnyjeFactory/LocalizovannyjeZaprosy> query geolocalization classifier)) - new version of factors [328]-[330]: R - georelevant - the regional query results could be useful but nothing more than that;"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 418
CppName: "FI_REGIONAL_V_QUERY_NEW"
Name: "GeoRegionalityVNew"
DependsOn: [{Feature: ["GeoRegionalityVNew"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The query factors. The result of work ((<http://wiki.yandex-team.ru/PoiskovajaPlatforma/Lingvistika/ZaprosnyjeFactory/LocalizovannyjeZaprosy> query geolocalization classifier)) - new version of factors [328]-[330]: V - geo-vital - the regional query results are essential."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 419
CppName: "FI_ALICE_MUSIC_ARTIST_NAME_PER_WORD_CM_MAX_PREDICTION_MIN"
Name: "AliceMusicArtistNamePerWordCMMaxPredictionMin"
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: "The PerWordCMMaxPredictionMin factor value for the AliceMusic stream"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost>"
Ticket: ["BUKI-2932"]
Authors: "anrodigina"
Responsibles: ["anrodigina", "gotmanov", "hommforever"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 420
CppName: "FI_PAGE_RANK_UKR"
Name: "UkrainPageRank"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: "Ukrainian Page rank"
Responsibles: "alsafr"
}
Factor {
Index: 421
CppName: "FI_QCLASS_DOWNLOAD"
Name: "QClassDownload"
DependsOn: [{Feature: ["QClassDownload"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "=1 - incl. the Download formula. Queries of the category: download/watch online/play/photo/listen to"
Authors: "asannikova"
Responsibles: "alsafr"
}
Factor {
Index: 422
CppName: "FI_QCLASS_BRANDNAMES"
Name: "QClassBrandnames"
DependsOn: [{Feature: ["QClassBrandnames"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The result of the query classifier is that the query contains words from the corresponding dictionary. Brand"
Authors: "agorodilov"
Responsibles: "agorodilov"
}
Factor {
Index: 423
CppName: "FI_QCLASS_DISEASE"
Name: "QClassDisease"
DependsOn: [{Feature: ["QClassDisease"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "medical dictionary"
Authors: "agorodilov"
Responsibles: "agorodilov"
}
Factor {
Index: 424
CppName: "FI_QCLASS_KAK"
Name: "QClassKak"
DependsOn: [{Feature: ["QClassKak"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "question"
Authors: "agorodilov"
Responsibles: "agorodilov"
}
Factor {
Index: 425
CppName: "FI_QCLASS_MOSCOW"
Name: "QClassMoscow"
DependsOn: [{Feature: ["QClassMoscow"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "the query applies to Moscow"
Authors: "agorodilov"
Responsibles: "agorodilov"
}
Factor {
Index: 426
CppName: "FI_QCLASS_OAO"
Name: "QClassOAO"
DependsOn: [{Feature: ["QClassOAO"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "organization"
Authors: "agorodilov"
Responsibles: "agorodilov"
}
Factor {
Index: 427
CppName: "FI_QCLASS_PORNO"
Name: "QClassPorno"
DependsOn: [{Feature: ["QClassPorno"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "porn"
Authors: "agorodilov"
Responsibles: "agorodilov"
}
Factor {
Index: 428
CppName: "FI_QCLASS_TRAVEL"
Name: "QClassTravel"
DependsOn: [{Feature: ["QClassTravel"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "traveling"
Authors: "agorodilov"
Responsibles: "agorodilov"
}
Factor {
Index: 429
CppName: "FI_VIDEO_RATING"
Name: "VideoRating"
Ticket: "VIDEOPOISK-342"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/VideoRating>"
Tags: [TG_DOC, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "The popularity of the video which comes from the video"
Comment: "Outdated. Must be eliminated"
Authors: "bort"
Responsibles: "bort"
}
Factor {
Index: 430
CppName: "FI_PERIODIC_LINK_DATES_PERCENT"
Name: "PeriodicLinkDatesPercent"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "The periodicity of links pointing to the website"
Authors: "dremov"
Responsibles: "dremov"
}
Factor {
Index: 431
CppName: "FI_LINK_ALMOST_PERIOD"
Name: "LinkAlmostPeriod"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "The number of near-periodic links"
Authors: "dremov"
Responsibles: "dremov"
}
Factor {
Index: 432
CppName: "FI_QDOWNER_STAT_POWER"
Name: "QDOwnerStatPower"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The number of owner's impressions for the query, normalization x/(100 + x)."
Authors: "solar"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 433
CppName: "FI_QURL_STAT_POWER"
Name: "QUrlStatPower"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The number of URL impressions for the query, normalization x/(100 + x)."
Authors: "solar"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 434
CppName: "FI_HAS_LIRU_CNT"
Name: "HasLiRuCounter"
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The presence of the LiveInternet counter"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 435
CppName: "FI_OWNER_REQS_POPULARITY"
Name: "OwnerReqsPopularity"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/OwnerReqsPopularity>"
Description: "The owner’s popularity in queries"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 436
CppName: "FI_DSSM_YA_MUSIC_ASR_EARLY_BINDING_CE"
Name: "DssmYaMusicASREarlyBindingCe"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_DOC_CONTENT, TG_NEURAL, TG_UNUSED, TG_ALICE_MUSIC, TG_RTMODELS_SERVICE, TG_ALLOW_USE_FOR_ALICE]
Description: "DSSM model with early binding, trained on reformulations and additionally trained on the ASR hypotheses of musical queries for Alice"
Ticket: "BUKI-2960"
Authors: ["islobodskov", "anrodigina"]
Responsibles: ["islobodskov", "anrodigina"]
}
Factor {
Index: 437
CppName: "FI_DSSM_BERT_DISTILL_SINSIG_CE_COUNTRY_REG_CHAIN"
Name: "DssmBertDistillSinsigCeCountryRegChain"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_NEURAL, TG_USE_MARKUP, TG_ALL_RELEVANCE_MARKUP, TG_SIN_SIG_MARKUP, TG_BERT_DISTILL, TG_UNIMPLEMENTED, TG_DEPRECATED]
Description: "The model was trained on a set on PRS-log for the Bert prediction, which was trained on sinsig_ce with a threshold 0.5, using a chain of regions to a country"
UseArtifact: {Name: "DssmBertDistillSinsigCeCountryRegChain"}
Ticket: "FACTOR-2287"
Authors: ["ivaninap", "rmplstiltskin"]
Responsibles: ["ivaninap", "rmplstiltskin"]
}
Factor {
Index: 438
CppName: "FI_DSSM_YA_MUSIC_EARLY_BINDING_CE"
Name: "DssmYaMusicEarlyBindingCe"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_DOC_CONTENT, TG_NEURAL, TG_UNDOCUMENTED, TG_UNUSED, TG_ALICE_MUSIC, TG_RTMODELS_SERVICE, TG_ALLOW_USE_FOR_ALICE]
Description: "DSSM model with early binding, trained on reformulations and additionally trained on the musical queries for Alice"
Ticket: "BUKI-2950"
Authors: "islobodskov"
Responsibles: "islobodskov"
ImplementationTime: "2020-03-17"
}
Factor {
Index: 439
CppName: "FI_SECOND_INDEG_DISTR_XI"
Name: "SecondIndegDistrXi"
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: "Eleven factors based on the statistical properties of the distributions of incoming vertex degrees, which refer to a fixed vertex of the hostgraph.((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/hostdegree> in more detail))"
Authors: "filimonov"
Responsibles: "alsafr"
}
Factor {
Index: 440
CppName: "FI_PIRACY_DETECTOR_PREDICT"
Name: "PiracyDetectorPredict"
Ticket: "COMMERCIAL-4"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: "The value of the piracy detector calculated in the Hippopotamus (algorithm)."
MinValue: -10
MaxValue: 10
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
ImplementationTime: "2020-08-17"
}
Factor {
Index: 441
CppName: "FI_ALICE_MUSIC_URL_TYPE_IS_ALBUM"
Name: "AliceMusicUrlTypeIsAlbum"
Tags: [TG_DOC, TG_ALICE_MUSIC, TG_URL_TEXT, TG_BINARY, TG_NN_OVER_FEATURES_USE]
Description: "The canonicalized URL type of Yandex music - album"
Ticket: "BUKI-2932"
Authors: ["anrodigina", "gotmanov"]
Responsibles: ["anrodigina", "gotmanov"]
ImplementationTime: "2020-03-11"
}
Factor {
Index: 442
CppName: "FI_FIRST_VALID_TS_10DAYS"
Name: "FirstValidTs10Days"
Group: "Datetime"
Ticket: "WEBFRESH-695"
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_FRESHNESS_USE, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "It is calculated as (10 - x), where x is the age of the document in days (continuous) relative to the document's validity time in the Yandex index"
Authors: "alejes"
Responsibles: "alejes"
ImplementationTime: "2020-09-27"
}
Factor {
Index: 443
CppName: "FI_HOST_IN_QUERY"
Name: "HostInQuery"
Tags: [TG_DYNAMIC, TG_HOST, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "The document host is recognized in the query"
Ticket: "WEBFRESH-623"
Authors: "alejes"
Responsibles: "alejes"
ImplementationTime: "2020-04-18"
}
Factor {
Index: 444
CppName: "FI_VITAL_HOST_IN_QUERY"
Name: "VitalHostInQuery"
Tags: [TG_DYNAMIC, TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "The URL only consists of the host that is recognized in the query"
Ticket: "WEBFRESH-623"
Authors: "alejes"
Responsibles: "alejes"
ImplementationTime: "2020-04-18"
}
Factor {
Index: 445
CppName: "FI_YANDEX_NEWS_STORY_URL"
Name: "YandexNewsStoryUrl"
Tags: [TG_DYNAMIC, TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "The URL is the subject of Yandex news"
Ticket: "WEBFRESH-685"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
ImplementationTime: "2020-08-28"
}
Factor {
Index: 446
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D1T240"
Name: "RcSpylogUrlRationalSigmoidD1T240"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "URL feature computed from rapid clicks spy_log counters with decay of 1 day"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 447
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D1T240_FROZEN"
Name: "RcSpylogUrlRationalSigmoidD1T240Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: "URL feature computed from rapid clicks spy_log counters with decay of 1 day"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-09-01"
}
Factor {
Index: 448
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D0_5T30"
Name: "RcSpylogUrlRationalSigmoidD0_5T30"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "URL feature computed from rapid clicks spy_log counters with decay of 0.5 days"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 449
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D0_5T30_FROZEN"
Name: "RcSpylogUrlRationalSigmoidD0_5T30Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: "URL feature computed from rapid clicks spy_log counters with decay of 0.5 days"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-09-01"
}
Factor {
Index: 450
CppName: "FI_TIMESTAMP"
Name: "Timestamp"
Group: "Datetime"
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_REARR_USE, TG_FRESHNESS_USE, TG_UNUSED]
Description: "It is calculated as (80 - x) / 80, where x is the age of the document in hours. The factors only make sense for the fastbot base (last 80 hours). They are not used in ranking. They are used in re-ranking."
Authors: "melton"
Responsibles: ["melton", "alsafr"]
}
Factor {
Index: 451
CppName: "FI_ADD_TIME_FULL"
Name: "AddTimeFull"
Group: "Datetime"
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_REARR_USE, TG_FRESHNESS_USE, TG_UNUSED]
Description: "It is calculated as (80 - x) / 80, where x is the age of the document in hours. The factors only make sense for the fastbot base (last 80 hours). They are not used in ranking. They are used in re-ranking."
Authors: "melton"
Responsibles: ["melton", "alsafr"]
}
Factor {
Index: 452
CppName: "FI_SWBM25"
Name: "Swbm25"
Wiki: "<http://wiki.yandex-team.ru/SWBM25>"
Group: "SWBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: "Sly BM25 in a sliding window. The window size is specified in sentences. “Jokers” are used for headings and the beginning of the document. The morphological similarity and structure of the text are considered. The window weight decays with distance from the beginning of the document."
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 453
CppName: "FI_PLM"
Name: "PositionLanguageModel"
Ticket: "COMBPROLAB-51"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/PositionLanguageModel>"
Group: "PositionLanguageModel"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_DEPRECATED]
Description: "This factor shows how good a snippet can be created."
Responsibles: "alsafr"
}
Factor {
Index: 454
CppName: "FI_TEXT_PAIR_W1"
Name: "TxtPair_W1"
Group: "TextBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "A simple BM25 on word pairs - we take all pairs of query words and count the number of their occurrences in the document text. Weight = 1. Note: it doesn't work if there is a stop word in the query"
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 455
CppName: "FI_AURA_DOC_LOG_SHARED"
Name: "AuraDocLogShared"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_DEPRECATED]
Description: "Logarithm of the number of shingles on which the given document is not unique"
Authors: "antonovvk"
Responsibles: ["antonovvk", "smax"]
}
Factor {
Index: 456
CppName: "FI_AURA_DOC_LOG_AUTHOR"
Name: "AuraDocLogAuthor"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_DEPRECATED]
Description: "Logarithm of the number of shingles on which the given document owner is recognized as the author"
Authors: "antonovvk"
Responsibles: ["antonovvk", "smax"]
}
Factor {
Index: 457
CppName: "FI_AURA_DOC_MEAN_SHARED_WEIGHT"
Name: "AuraDocMeanSharedWeight"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_DEPRECATED]
Description: "The average weight of non-unique shingles in a given document"
Authors: "antonovvk"
Responsibles: ["antonovvk", "smax"]
}
Factor {
Index: 458
CppName: "FI_MARKET_QUALITY_RATING"
Name: "MarketQualityRating"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: "Mascot feature MarketQualityRating"
Ticket: "SEARCHSPAM-15531"
Authors: ["bikulov"]
Responsibles: ["bikulov", "sdormidontov"]
ImplementationTime: "2020-09-30"
}
Factor {
Index: 459
CppName: "FI_MEDICAL2_HOST_QUALITY"
Name: "Medical2HostQuality"
Ticket: "SENS-87"
Authors: ["anrodigina"]
Responsibles: ["anrodigina", "hommforever"]
Description: "Medical host quality for new marks."
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: "2021-01-12"
}
Factor {
Index: 460
CppName: "FI_MEDICAL2_HOST_QUALITY_FRESH"
Name: "Medical2HostQualityFresh"
Ticket: "SENS-87"
Authors: ["anrodigina"]
Responsibles: ["anrodigina", "hommforever"]
Description: "Medical host quality for new marks for experiments."
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: "2021-01-12"
}
Factor {
Index: 461
CppName: "FI_FIN_LAW_HOST_QUALITY"
Name: "FinLawHostQuality"
Ticket: "SENS-85"
Authors: ["anrodigina"]
Responsibles: ["anrodigina", "hommforever"]
Description: "Finance or law host quality for new marks."
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_NOT_01, TG_USED_IN_CONF_REARR]
MinValue: -1
MaxValue: 1
ImplementationTime: "2021-01-12"
}
Factor {
Index: 462
CppName: "FI_FIN_LAW_HOST_QUALITY_FRESH"
Name: "FinLawHostQualityFresh"
Ticket: "SENS-85"
Authors: ["anrodigina"]
Responsibles: ["anrodigina", "hommforever"]
Description: "Finance or law host quality for new marks for experiments."
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: "2021-01-12"
}
Factor {
Index: 463
CppName: "FI_SOS_HOST_QUALITY"
Name: "SosHostQuality"
Ticket: "SENS-84"
Authors: ["anrodigina"]
Responsibles: ["anrodigina", "hommforever"]
Description: "Finance or law host quality for new marks."
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: "2021-01-12"
}
Factor {
Index: 464
CppName: "FI_SOS_HOST_QUALITY_FRESH"
Name: "SosHostQualityFresh"
Ticket: "SENS-84"
Authors: ["anrodigina"]
Responsibles: ["anrodigina", "hommforever"]
Description: "Finance or law host quality for new marks for experiments."
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: "2021-01-12"
}
Factor {
Index: 465
CppName: "FI_CS_DOCUMENTATION_HOST"
Name: "CsDocumentationHost"
Ticket: "SEARCHPLAY-101"
Authors: "alejes"
Responsibles: "alejes"
Description: "Factor for host in list of documentation cs hosts for experiments"
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 466
CppName: "FI_REMOVED_466"
Name: "Removed_466"
Tags: [TG_REMOVED]
}
Factor {
Index: 467
CppName: "FI_REG_HOST_RANK"
Name: "RegHostRank"
Group: "RegHostStatic"
Tags: [TG_LOCALIZED_COUNTRY, TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "It is calculated the same way as the HostRank factor, but not on the whole owner-graph but on its subgraph, which consists of the given region’s owners. Belonging to a region is determined by TLD, or by the presence of pages from the given owner in the index, which are recognized to be from this region by the geo or geoa classifier. It is mapped the same way as the HostRank factor, with a number from 0 to 1 with 256 gradations"
Authors: "yoda"
Responsibles: "alsafr"
}
Factor {
Index: 468
CppName: "FI_REG_IS_WIKI"
Name: "RegIsWiki"
Group: "RegHostStatic"
Tags: [TG_LOCALIZED_COUNTRY, TG_HOST, TG_STATIC, TG_WIKIPEDIA, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: "The document is from the language section of Wikipedia that is the same as the user's region"
Authors: "yoda"
Responsibles: "alsafr"
}
Factor {
Index: 469
CppName: "FI_LANGUAGE_COMPLIANCE"
Name: "LanguageCompliance"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The document language matches the language of the query"
Authors: "ekrokhalev"
Responsibles: "lamo"
}
Factor {
Index: 470
CppName: "FI_COUNTRY_POPULAR_Q"
Name: "CountryPopularQ"
DependsOn: [{Feature: ["CountryPopularQ"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: "Query popularity within the country"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/PopularQ>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 471
CppName: "FI_COUNTRY_Q_DIVERSITY"
Name: "CountryQDiversity"
DependsOn: [{Feature: ["CountryQDiversity"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: "The degree of centralization of the points from which the query is made (within the country)"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QDiversity>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 472
CppName: "FI_COUNTRY_Q_DIVERSITY2"
Name: "CountryQDiversity2"
DependsOn: [{Feature: ["CountryQDiversity2"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: "Geographic distribution of the query within the country"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Diversity2>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 473
CppName: "FI_COUNTRY_HOUR"
Name: "CountryHour"
DependsOn: [{Feature: ["CountryHour"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: "The hour during which this query is used most frequently"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 474
CppName: "FI_COUNTRY_HOUR_DIVERSITY"
Name: "CountryHourDiversity"
DependsOn: [{Feature: ["CountryHourDiversity"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: "How often the query is used at different times of the day (within the country)"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity>"
Authors: "denplusplus"
Responsibles: ["diver", "akhropov"]
}
Factor {
Index: 475
CppName: "FI_REMOVED_475"
Name: "Removed_475"
Tags: [TG_REMOVED]
}
Factor {
Index: 476
CppName: "FI_NATIONAL_DOMAIN"
Name: "NationalDomain"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document country (domain) and the user country match ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#nationaldomain> in more detail))"
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 477
CppName: "FI_IS_PORNO_ADVERT"
Name: "IsPornoAdvert"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The page contains porn ads"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/IsPornoAdvert>"
Authors: "ashagarov"
Responsibles: "ashagarov"
}
Factor {
Index: 478
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D3T120"
Name: "RcSpylogUrlRationalSigmoidD3T120"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "URL feature computed from rapid clicks spy_log counters with decay of 3 days"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 479
CppName: "FI_COUNTRY_QUERY_REGIONALITY"
Name: "CountryQueryRegionality"
DependsOn: [{Feature: ["CountryQueryRegionality"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The country localizability classifier - shows how much the query implies country context"
Authors: "shutovich"
Responsibles: "shutovich"
}
Factor {
Index: 480
CppName: "FI_NUM_SLASHES"
Name: "NumSlashes"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Number of slashes in the URL"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 481
CppName: "FI_BM25F_DPR_OBSOLETE"
Name: "BM25FdPR_obsolete"
Group: "BM25F"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNUSED, TG_L2]
Description: "BM25 with different parameters for different fields, including incoming anchor text. The text weights of the links included in the page are normalized depending on the delta page rank of the link."
Authors: ["grechnik", "kustarev"]
Responsibles: "grechnik"
}
Factor {
Index: 482
CppName: "FI_WATCH_VIDEO"
Name: "WatchVideo"
Tags: [TG_DOC, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The presence of a built-in video player on the page"
Responsibles: "osenzen"
}
Factor {
Index: 483
CppName: "FI_DOWNLOAD_VIDEO"
Name: "DownloadVideo"
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Video for downloading"
Responsibles: "alsafr"
}
Factor {
Index: 484
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D3T120_FROZEN"
Name: "RcSpylogUrlRationalSigmoidD3T120Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: "URL feature computed from rapid clicks spy_log counters with decay of 3 days"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-09-01"
}
Factor {
Index: 485
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D14T300"
Name: "RcSpylogUrlRationalSigmoidD14T300"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "URL feature computed from rapid clicks spy_log counters with decay of 14 days"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 486
CppName: "FI_SUBRELEV"
Name: "SubRelevance"
Tags: [TG_DOC, TG_TRANS, TG_REARR_USE, TG_UNUSED, TG_OFTEN_ZERO]
Description: "A service factor that was needed to search on the website, and will still be needed in the future."
Authors: "karpik"
Responsibles: "apos"
}
Factor {
Index: 487
CppName: "FI_GSK_URL_MODEL"
Name: "GskUrlModel"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/gsk>"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor is calculated from the URL text using the quality/seq/gsk sequence classifier"
Authors: "gulin"
Responsibles: "gulin"
}
Factor {
Index: 488
CppName: "FI_URL_TRIGRAMS"
Name: "UrlTrigrams"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlTrigrams>"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Model with training of each trigram on '+' and '-' URLs. It does not depend on the query."
Authors: ["botay", "denplusplus"]
Responsibles: "alsafr"
}
Factor {
Index: 489
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D14T300_FROZEN"
Name: "RcSpylogUrlRationalSigmoidD14T300Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: "URL feature computed from rapid clicks spy_log counters with decay of 14 days"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-09-01"
}
Factor {
Index: 490
CppName: "FI_RC_SPYLOG_AGE"
Name: "RcSpylogAge"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_NOT_01, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Age of rapid clicks spy_log update, in seconds"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
MinValue: 0
MaxValue: 2592000
}
Factor {
Index: 491
CppName: "FI_RC_SPYLOG_FRESHNESS"
Name: "RcSpylogFreshness"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Freshness of rapid clicks spy_log update"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 492
CppName: "FI_YMW_FULL"
Name: "YmwFull"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_DEPRECATED]
Description: "The size of the minimum piece of text that includes all query words in the document. It’s not being used now. ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YMW> in more detail))"
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 493
CppName: "FI_BCLM"
Name: "Bclm"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The Buettcher, Clarke and Lushman name factor (modified) ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BCLm> in more detail))"
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 494
CppName: "FI_QUERY_COMMERCIALITY_MX"
Name: "QueryCommercialityMx"
DependsOn: [{Feature: ["QueryCommercialityMx"], Slice: "begemot_query_factors"}]
Ticket: "SEARCHSPAM-2317"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QueryCommercialityMx>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COMMERCIAL, TG_TRANS, TG_REARR_USE, TG_L2, TG_DEPRECATED]
Countries: [CNT_RU, CNT_TR]
Description: "A measure of the 'commerciality' of the query. It is a MatrixNet factor that’s complexly calculated by a formula based on the purchasing dictionary in direct + based on the logs of user requests + additional intent dictionaries. Queries with a purchase intent gravitate toward 1, product queries toward 0.6, and queries with an intent not to purchase (reviews and so on) toward 0 ((<http://wiki.yandex-team.ru/AntonNeljubin/FaktorydljaNovogoKlassifikatorazaprosov> classifier factors))((<http://wiki.yandex-team.ru/JandeksPoisk/Antispam/AntiSEO/KlassifikatorKommercheskixZaprosov> more about it))"
Authors: ["anelyubin", "kvn"]
Responsibles: ["anelyubin", "kvn"]
DependsOn: [{Feature: ["QueryNonCommerciality", "TovarCategoryQuery", "TovarCategoryVendor", "IsNavQuery", "QClassDownload", "QClassBrandnames", "QClassDisease", "QClassKak", "QClassMoscow", "QClassOAO", "QClassPorno", "QClassTravel", "CountryPopularQ"]}]
}
Factor {
Index: 495
CppName: "FI_FIELD_LM"
Name: "FieldLM"
Group: "BM25F"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Unigram language model. The language is modeled based on the document, smoothed by the general language model. When creating a model based on the document, we use information about in which field of the document the query word was found (Title, head or plain text)"
Authors: "ylogachev"
Responsibles: "ylogachev"
}
Factor {
Index: 496
CppName: "FI_GEO_CITY_URL_REGION_CITY"
Name: "GeoCityUrlRegionCity"
Ticket: "BUKI-1125"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_URL_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The match of the geography determined by the URL of the document and the city of the query (ip or lr)"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 497
CppName: "FI_GEO_CITY_URL_REGION_REGION"
Name: "GeoCityUrlRegionRegion"
Ticket: "BUKI-1125"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The match of the geography determined by the URL of the document and the city of the query (ip or lr)"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 498
CppName: "FI_GEO_CITY_URL_REGION_COUNTRY"
Name: "GeoCityUrlRegionCountry"
Ticket: "BUKI-1125"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_URL_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The match of the geography determined by the URL of the document and the city of the query (ip or lr). Related to Russia and Ukraine."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 499
CppName: "FI_GEO_CITY_URL_GEO_CITY_CITY"
Name: "GeoCityUrlGeoCityCity"
Ticket: "BUKI-1125"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_GEOINQUERY, TG_URL_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The match of the geography determined by the URL of the document and the city of the query (the GeoCity rule)"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 500
CppName: "FI_PAY_APP_DETECTOR_PREDICT"
Name: "PayAppDetectorPredict"
Ticket: "COMMERCIAL-19"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: "The value of the forked commerce detector calculated in Hippo (algorithm name)."
MinValue: -10
MaxValue: 10
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
ImplementationTime: "2020-08-01"
}
Factor {
Index: 501
CppName: "FI_TITLE_TRIGRAMS_Q"
Name: "TitleTrigramsQuery"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Calculates the query coverage of the document title by the letter trigrams"
Authors: "akorsun"
Responsibles: "alsafr"
}
Factor {
Index: 502
CppName: "FI_TITLE_TRIGRAMS_T"
Name: "TitleTrigramsTitle"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Calculates the heading coverage of the document title by the letter trigrams"
Authors: "akorsun"
Responsibles: "alsafr"
}
Factor {
Index: 503
CppName: "FI_INLINKS_MODEL"
Name: "InlinksModel"
Ticket: "COMBPROLAB-69"
Group: ["Xref", "Dynamic"]
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_UNUSED]
Description: "The probabilistic model that’s built on the texts of incoming links"
Authors: "grechnik"
Responsibles: "grechnik"
}
Factor {
Index: 504
CppName: "FI_QUERY_WORD_SEQUENCES_TR"
Name: "QueryWordSequencesTR"
Group: "QueryWordSequencesTR"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "It calculates the sum of occurrences of the following type: a sequence of query words longer than two that are encountered in one sentence; normalized to document length."
Authors: "akorsun"
Responsibles: "alsafr"
}
Factor {
Index: 505
CppName: "FI_QUERY_WORD_SEQUENCES_LR"
Name: "QueryWordSequencesLR"
Group: "QueryWordSequencesLR"
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "It calculates the sum of occurrences of the following type: a sequence of query words longer than two that are encountered in one link; normalized to a number of links."
Authors: "akorsun"
Responsibles: "alsafr"
}
Factor {
Index: 506
CppName: "FI_OWNER_NAV_QUOTA"
Name: "OwnerNavQuota"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The percentage of clicks from navigational queries"
Authors: "ulyanov"
Responsibles: ["ulyanov", "tarum", "niknik"]
}
Factor {
Index: 507
CppName: "FI_GEO_RELEV_ALIEN_CITY"
Name: "GeoRelevAlienCity"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: "The result has a geo-reference that does not match the user's geography at the city level ([415]==1 && [215]==0)"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 508
CppName: "FI_GEO_V_QUERY_IN_USERS_CITY"
Name: "GeoVQueryInUserCity"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Geo-vitality of the query for results from the user's region"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 509
CppName: "FI_GEO_V_QUERY_IN_ALIEN_CITY"
Name: "GeoVQueryInAlienCity"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Geo-vitality of the query for results not from the user's region"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 510
CppName: "FI_HOST_RELIABILITY"
Name: "HostReliability"
Tags: [TG_HOST, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The percentage of URLs that respond without errors"
Responsibles: "alsafr"
}
Factor {
Index: 511
CppName: "FI_DMOZ_THEME_MATCH_ALL"
Name: "DmozThemeMatchAll"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The match of the topic spectrum (according to DMOZ) of the query and the document. The query topic is determined by ((<http://wiki.yandex-team.ru/JandeksPoisk/ZarubezhnyjjInternet/DMOZqueryClassifier1> the sorcerer’s (algorithm) rule DMOZTheme )). The document topic is determined by an automatic classifier"
Authors: ["ekrokhalev", "pyal"]
Responsibles: ["pyal", "lamo"]
}
Factor {
Index: 512
CppName: "FI_DMOZ_THEME_MATCH_BEST"
Name: "DmozThemeMatchBest"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The match of the topic spectrum (according to DMOZ) of the query and the document. The query topic is determined by the best result ((<http://wiki.yandex-team.ru/JandeksPoisk/ZarubezhnyjjInternet/DMOZqueryClassifier1> the sorcerer’s (algorithm) rule DMOZTheme )) The document topic is determined by an automatic classifier"
Authors: ["ekrokhalev", "pyal"]
Responsibles: ["pyal", "lamo"]
}
Factor {
Index: 513
CppName: "FI_MPSA"
Name: "Mpsa"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Estimates the minimum distance between pairs of query words, considering the distance between the pair and the beginning of the document (Minimal Pair Size with Attenuation). Pairs are considered as all consecutive bigrams of query words. Thus, the number of pairs is equal to the number of words in the query minus 1. Accordingly, the factor makes sense for queries consisting of more than one word.((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MPSA> MPSA))"
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 514
CppName: "FI_BCLM2"
Name: "Bclm2"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Differs from BCLm by the fact that the weights of all words are assumed to be the same. ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BCLm2> BCLm2))"
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 515
CppName: "FI_ABSOLUTE_PLM"
Name: "AbsolutePLM"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The text relevance is based on the language model, including the absolute position. We go through the text with the size (step) of 20 words, build a language model for each step (that is, a probability distribution of the words of the Russian language) and calculate the probability of generating a query. We penalize the model for distance from the beginning of the document"
Authors: "kustarev"
Responsibles: "alsafr"
}
Factor {
Index: 516
CppName: "FI_PAGE_REGION_COVERAGE"
Name: "PageRegionCoverage"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 517
CppName: "FI_PAGE_REGION_SIZE"
Name: "PageRegionSize"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: "The size of the page region"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 518
CppName: "FI_PAGE_REGION_REL_COVERAGE"
Name: "PageRegionRelCoverage"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 519
CppName: "FI_RC_SPYLOG_FRESHNESS_AT_REQ"
Name: "RcSpylogFreshnessAtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: "Freshness of rapid clicks spy_log update, calculated at the request time"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-09-01"
}
Factor {
Index: 520
CppName: "FI_QUERY_ISGEO"
Name: "IsGeo"
DependsOn: [{Feature: ["IsGeo"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1316"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsGeo>"
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "It sends the maximum weight of the query’s encountered geo object in the request to basic searches under the name isgeo. As a geo object, it’s considered to imply a category object Geo, Geo1, GeoAddr, GeoAddr1, LandMark, LandMark1 (see ((<http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects> som markup))).((<http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares> in more detail))"
Authors: "arseny"
Responsibles: "arseny"
}
Factor {
Index: 521
CppName: "FI_QUERY_ISMUSIC"
Name: "IsMusic"
DependsOn: [{Feature: ["IsMusic"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1316"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsMusic>"
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "It sends the maximum weight of the query’s encountered geo object in the Music or Music1 category to basic searches under the name ismusic. (see ((<http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects> som markup))).((<http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares> in more detail))"
Authors: "arseny"
Responsibles: "arseny"
}
Factor {
Index: 522
CppName: "FI_BCLM_LITE"
Name: "BclmLite"
Group: "BCLM"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NO_L3, TG_NN_OVER_FEATURES_USE]
Description: "The modification of the Bclm2 factor that was simplified for use in fastrank. The main difference is that BclmLite does not use absolute word offsets relative to the beginning of the document. Instead, the factor works with regular positions of the form <Sentence_number, Position_in_sentence>. At the same time, the proximity between words is taken into account only within the sentence.((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BCLmLite> BCLmLite))"
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 523
CppName: "FI_QUERY_NEARBY"
Name: "NearbyQuery"
DependsOn: [{Feature: ["NearbyQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "When answering a query, the results in the immediate proximity are important ([pharmacies], [children's clinics])"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 524
CppName: "FI_QUERY_CITY"
Name: "CityQuery"
DependsOn: [{Feature: ["CityQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_DEPRECATED]
Description: "When answering a query, the results within the city are important (the bulk of localizable queries)"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 525
CppName: "FI_QUERY_ADM"
Name: "AdmQuery"
DependsOn: [{Feature: ["AdmQuery"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_DEPRECATED]
Description: "When answering a query, the results from the user’s area and region are important ([airport], [dairy factory])"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 526
CppName: "FI_NUM_LINKS_FROM_MP"
Name: "NumLinksFromMP"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The number of incoming links from homepages"
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 527
CppName: "FI_YMW_FULL2"
Name: "YmwFull2"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "A fixed YmwFull. It differs from the previous version only by its behavior on 2-word queries. ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YMW> in more detail))"
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 528
CppName: "FI_FULL_QUORUM"
Name: "FullQuorum"
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_REARR_USE, TG_DEPRECATED]
Description: "Binary factor, each query word exists in the text or in the links"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 529
CppName: "FI_AUXC_TEXT_BM25"
Name: "AuxCTextBM25"
AntiSeoUpperBound: 0.8
Group: "AuxBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_UNUSED, TG_OFTEN_ZERO]
Description: "uses 'country aux tree' (auxqc)"
Authors: "shutovich"
Responsibles: "shutovich"
}
Factor {
Index: 530
CppName: "FI_AUXC_LINK_BM25"
Name: "AuxCLinkBM25"
AntiSeoUpperBound: 0.8
Group: "AuxBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_UNUSED, TG_OFTEN_ZERO]
Description: "uses 'country aux tree' (auxqc)"
Authors: "shutovich"
Responsibles: "shutovich"
}
Factor {
Index: 531
CppName: "FI_SOFT_404"
Name: "Soft404"
Ticket: "ARC-1046"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Page — '404' (the percentage of '404' tokens in relation to the total number of tokens on the page)"
Authors: "avatar"
Responsibles: "avatar"
}
Factor {
Index: 532
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D1T240_AT_REQ"
Name: "RcSpylogUrlRationalSigmoidD1T240AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: "URL feature computed at the request time from rapid clicks spy_log counters with decay of 1 day"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-09-01"
}
Factor {
Index: 533
CppName: "FI_DBM25"
Name: "DBM25"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DBM25>"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "BM25, in which the word weight is machine-matched"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 534
CppName: "FI_QUERY_WORD_COHESION_TR"
Name: "QueryWordCohesionTR"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The factor evaluates how query words are grouped with each other in the document text regardless of their order. ((<http://wiki.yandex-team.ru/SergejjKrylov/QueryWordCohesionTR> description))"
Authors: "kryloff"
Responsibles: "kryloff"
}
Factor {
Index: 535
CppName: "FI_OWNER_SESS_NORM_DUR_REG"
Name: "OwnerSessNormDuration_Reg"
Group: "RegHostStatic"
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "nd/k normalized time before the click"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 536
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D0_5T30_AT_REQ"
Name: "RcSpylogUrlRationalSigmoidD0_5T30AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: "URL feature computed at the request time from rapid clicks spy_log counters with decay of 0.5 days"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-09-01"
}
Factor {
Index: 537
CppName: "FI_QUERY_DOWNER_SESS_NORM_DUR_REG"
Name: "QueryDOwnerSessNormDuration_Reg"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "nd/k"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 538
CppName: "FI_QUERY_DOWNER_WEIGHT_CLICK_REG"
Name: "QueryDOwnerWeightClick_Reg"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "w/k"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 539
CppName: "FI_QUERY_DOWNER_ONLY_CLICK_RATE_REG"
Name: "QueryDOwnerOnlyClickRate_Reg"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "o/i"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 540
CppName: "FI_QUERY_DOWNER_CLICK_SUMMARY_REG"
Name: "QueryDOwnerClickSummary_Reg"
Ticket: "BUKI-955"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "a selected formula"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["popescul", "cliff", "angshu", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 541
CppName: "FI_QUERY_DOWNER_SATISFIED4_RATE_REG"
Name: "QueryDOwnerSatisfied4Rate_Reg"
Ticket: "BUKI-955"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "r_s4b/(r_k + 10)"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["popescul", "cliff", "angshu", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 542
CppName: "FI_SEGMENT_AUX_ALPHAS_IN_TEXT"
Name: "SegmentAuxAlphasInText"
Ticket: "BUKI-1109"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SegmentAuxAlphasInText>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of letters in the Aux segment"
Authors: "avatar"
Responsibles: "avatar"
}
Factor {
Index: 543
CppName: "FI_SEGMENT_AUX_SPACES_IN_TEXT"
Name: "SegmentAuxSpacesInText"
Ticket: "BUKI-1109"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SegmentAuxSpacesInText>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of spaces in the Aux segment"
Authors: "avatar"
Responsibles: "avatar"
}
Factor {
Index: 544
CppName: "FI_SEGMENT_CONTENT_COMMAS_IN_TEXT"
Name: "SegmentContentCommasInText"
Ticket: "BUKI-1109"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SegmentContentCommasInText>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of commas in the Content segment"
Authors: "avatar"
Responsibles: "avatar"
}
Factor {
Index: 545
CppName: "FI_CLASSIF_IS_SHOP"
Name: "IsShop"
Ticket: "BUKI-1128"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_DEPRECATED, TG_L2]
Description: "The shop page. ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#isshop> description)). It is not being used (deprecated)"
Authors: "smikler"
Responsibles: "smikler"
}
Factor {
Index: 546
CppName: "FI_LR_GEO_RELEV_REGION_NATDOM"
Name: "XLRGeoRelevRegionNatDomain"
Group: "Xref"
Tags: [TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_LINK_GRAPH, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Authors: "agorodilov"
Responsibles: "agorodilov"
}
Factor {
Index: 547
CppName: "FI_AURA_DOC_LOG_ORIGIN"
Name: "AuraDocLogOrigin"
Tags: [TG_DOC_TEXT, TG_OWNER, TG_STATIC, TG_REARR_USE, TG_UNUSED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "The logarithm of the number of shingles in a document added by the website owner as original texts in ((<http://wiki.yandex-team.ru/JandeksPoisk/Jekosistema/MarketingPR/Webmasters/plan/vtorcontect> Originality Plugin)). It’s not needed in the formula; it is needed for re-ranking of the duplicates"
Authors: "antonovvk"
Responsibles: ["antonovvk", "smax"]
}
Factor {
Index: 548
CppName: "FI_AURA_DOC_MEAN_FLT_AUTHOR_SOURCE"
Name: "AuraDocMeanFltAuthorSource"
Tags: [TG_DOC_TEXT, TG_OWNER, TG_STATIC, TG_UNUSED, TG_DEPRECATED]
Description: "Average filtered number of document authorship sources. It’s not needed in the formula; it is needed for re-ranking of the duplicates"
Authors: "antonovvk"
Responsibles: ["antonovvk", "smax"]
}
Factor {
Index: 549
CppName: "FI_QUERY_REF_TRIGRAM_Q"
Name: "QueryRefTrigramQuery"
Ticket: "BUKI-1117"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#queryreftrigrams> description))"
Authors: "vvp"
Responsibles: ["mbusel", "tsimkha"]
}
Factor {
Index: 550
CppName: "FI_QUERY_REF_TRIGRAM_R"
Name: "QueryRefTrigramReferences"
Ticket: "BUKI-1117"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#queryreftrigrams> description))"
Authors: "vvp"
Responsibles: ["mbusel", "tsimkha"]
}
Factor {
Index: 551
CppName: "FI_IDF_VARIANCE"
Name: "IdfVariance"
Group: "Dynamic"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "IDF dispersion of query words given the presence of text hits in the document (mixed query-text factor)."
Authors: "grechnik"
Responsibles: "grechnik"
}
Factor {
Index: 552
CppName: "FI_URL_NGRAMS_MODEL"
Name: "UrlNGramsModel"
Ticket: "BUKI-1145"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/UrlNGramsModel>"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "UrlNGramsModel ranking factor in ERF."
Authors: "avatar"
Responsibles: "avatar"
}
Factor {
Index: 553
CppName: "FI_NATIONAL_LANGUAGE"
Name: "NationalLanguage"
Tags: [TG_LOCALIZED_COUNTRY, TG_DYNAMIC, TG_DOC_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: "The document's language matches the language of the query's country."
Authors: "dremov"
Responsibles: "dremov"
}
Factor {
Index: 554
CppName: "FI_OWNER_IS_COMMERCIAL"
Name: "OwnerIsCommercial"
Ticket: "SEARCHSPAM-2603"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostIsCommercial>"
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COMMERCIAL, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Authors: ["anelyubin", "sisoid"]
Responsibles: ["anelyubin", "sisoid"]
}
Factor {
Index: 555
CppName: "FI_GEO_COUNTRY_URL_REGION_COUNTRY"
Name: "GeoCountryUrlRegionCountry"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 556
CppName: "FI_GEO_COUNTRY_URL_GEO_COUNTRY"
Name: "GeoCountryUrlGeoCountry"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_GEOINQUERY, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 557
CppName: "FI_NUM_LINKS_FROM_SEGMENT_CONTENT"
Name: "NumLinksFromSegmentContent"
Ticket: "BUKI-1161"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/NumLinksFromSegmentContent>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 558
CppName: "FI_LOCM"
Name: "Locm"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Locm>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Order of words in links."
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 559
CppName: "FI_URL_QUERY_VARIETY_REG"
Name: "UrlQueryVariety_Reg"
Ticket: "BUKI-1159"
Group: "RegDocStatic"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The diversity of the queries from which the URL is clicked, calculated per region."
Wiki: "<https://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Kliki#urlqueryvarietyreg>"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 560
CppName: "FI_URL_SESS_NORM_DUR_RATE_REG"
Name: "UrlSessNormDurRate_Reg"
Ticket: "BUKI-1159"
Group: "RegDocStatic"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "n/a"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii>"
Authors: ["cliff", "akhropov", "angshu"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 561
CppName: "FI_FILTRATION_SEGMENTS"
Name: "FiltrationSegments"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: "The portion of query segments present in the text."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 562
CppName: "FI_LANGUAGE_GOOD_FOR_TURKEY"
Name: "LanguageGoodForTurkey"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document language is one of the acceptable languages for Turkey (Turkish, English, German, French, Arabic, Azerbaijani) or the document has a zero length. It is only calculated on the search stage for IsRealGeoLocal queries."
Authors: "dremov"
Responsibles: "dremov"
}
Factor {
Index: 563
CppName: "FI_DBM25_2"
Name: "DBM25_2"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: "Variation on the topic ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DBM25> DBM25)), see ysite/yandex/relevance/dbm25.cpp"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 564
CppName: "FI_GEO_DISPERSION"
Name: "GeoDispersion"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "Dispersion of the regions of links pointing to the document."
Authors: "bochkarev"
Responsibles: "bochkarev"
}
Factor {
Index: 565
CppName: "FI_QUERY_DOWNER_ENOUGH_CLICKED"
Name: "QueryDownerEnoughClicked"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QueryDownerEnoughClicked>"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The number of clicks on the owner and the number of clicks on the query are more than 5."
Authors: ["snailer", "akhropov"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 566
CppName: "FI_BM25F_DPR_FIXED"
Name: "BM25FdPRFixed"
Group: "BM25F"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: "BM25FdPR with normalization based on the average document length, dependent on document language. (Testing results: <http://wiki.yandex-team.ru/BM25FRework>)"
Authors: "lamo"
Responsibles: "lamo"
}
Factor {
Index: 567
CppName: "FI_LANG_POPULARITY"
Name: "LanguagePopularity"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Popularity of document language. A number from 0 to 1. ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LanguagePopularity> LanguagePopularity))"
Authors: "lamo"
Responsibles: "lamo"
}
Factor {
Index: 568
CppName: "FI_QUERY_DOWNER_WS_FRC_AND_BM25F_DPR_FIXED"
Name: "QueryDOwnerWeightedSumFRCAndBM25FdPRFixed"
Tags: [TG_DEPRECATED, TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOC_TEXT, TG_TRANS, TG_USER_SEARCH_EXTERNAL, TG_UNUSED, TG_L2]
Countries: CNT_RELEV
Description: "The sum of the factors QueryDOwnerClicksFRC and BM25FdPRFixed with weights 0.358449 and 0.184922 respectively. The number '565' in the factor name should not be taken as it is, it is either legacy or a typo."
Authors: ["grechnik", "kustarev"]
Responsibles: "grechnik"
DependsOn: [{Feature: ["QueryDOwnerClicksFRC", "BM25FdPRFixed"]}]
}
Factor {
Index: 569
CppName: "FI_QUERY_DOWNER_WS_MAX_WHR_AND_ONLY_CLICK_RATE"
Name: "QueryDOwnerWeightedSumMaxWHRAndOnlyClickRate"
Tags: [TG_DEPRECATED, TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_TRANS, TG_USER_SEARCH_EXTERNAL, TG_UNUSED]
Countries: CNT_RELEV
Description: "This is the weighted sum of factors 192 and 341 with weights 0.298942 and 0.454625 respectively."
Authors: ["grechnik", "kustarev"]
Responsibles: "grechnik"
DependsOn: [{Feature: ["MaxWordHostRank", "QueryDOwnerOnlyClickRate"]}]
}
Factor {
Index: 570
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D3T120_AT_REQ"
Name: "RcSpylogUrlRationalSigmoidD3T120AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: "URL feature computed at the request time from rapid clicks spy_log counters with decay of 3 days"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-09-01"
}
Factor {
Index: 571
CppName: "FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D14T300_AT_REQ"
Name: "RcSpylogUrlRationalSigmoidD14T300AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: "URL feature computed at the request time from rapid clicks spy_log counters with decay of 14 days"
Ticket: "USERFEAT-1493"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-09-01"
}
Factor {
Index: 572
CppName: "FI_TOCM"
Name: "Tocm"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Tocm>"
Group: "Tocm"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The factor evaluates the differences in the positions of words in the title from the positions of words in the query."
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 573
CppName: "FI_RELEV_GEO_LINKS_PERCENT"
Name: "RelevGeoLinksPercent"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_LINK_GRAPH, TG_UNDOCUMENTED, TG_UNUSED]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 574
CppName: "FI_LANG_DISPERSION"
Name: "LangDispersion"
Ticket: "BUKI-1228"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LangDispersion>"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "Variance of languages in xmap."
Authors: "kartynnik"
Responsibles: "kartynnik"
}
Factor {
Index: 575
CppName: "FI_HAS_MISSPELL"
Name: "HasMisspell"
DependsOn: [{Feature: ["HasMisspell"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "There is a typo in the query."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 576
CppName: "FI_DBM30_SMERCH"
Name: "DBM30Smerch"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The variation on the topic ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DBM25> DBM25)), see ysite/yandex/relevance/dbm25.cpp"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 577
CppName: "FI_IS_URL_FOR_CLICK_DEBOOST"
Name: "IsUrlForClickDeboost"
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_OFTEN_ZERO, TG_REARR_USE, TG_DATA_FROM_SAASKV, TG_USED_IN_CONF_REARR]
Authors: "hommforever"
Responsibles: ["hommforever", "ilnurkh"]
Description: "URL shows up too frequently with very low relevancy (according to Bert and/or BM25)."
ImplementationTime: "2021-01-12"
}
Factor {
Index: 578
CppName: "FI_URL_LINK_PERCENT"
Name: "UrlLinkPercent"
Ticket: "BUKI-1233"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/UrlLinkPercent>"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "This factor evaluates the ratio of the number of incoming links that have a text of a URL, to the total number of incoming links."
Authors: "suncpp"
Responsibles: "alsafr"
}
Factor {
Index: 579
CppName: "FI_DSSM_BERT_DISTILL_L2"
Name: "DssmBertDistillL2"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_NEURAL, TG_USE_MARKUP, TG_ALL_RELEVANCE_MARKUP, TG_SIN_SIG_MARKUP, TG_BERT_DISTILL, TG_L2]
Description: "A set of PRS logs is labeled using Bert trained on sinsig, and a dssm model is trained on this set using BaseRegionChain."
UseArtifact: {Name: "DssmBertDistillL2"}
Ticket: "BERT-179"
Authors: ["filmih"]
Responsibles: ["filmih"]
ImplementationTime: "2020-08-30"
}
Factor {
Index: 580
CppName: "FI_NUM_NON_LETTERS_IN_URL"
Name: "NumNonLettersInUrl"
Ticket: "BUKI-1238"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/NumNonLettersInUrl>"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of non-letters in the URL."
Authors: "kartynnik"
Responsibles: "kartynnik"
}
Factor {
Index: 581
CppName: "FI_URL_LENGTH_2"
Name: "UrlLen2"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_UNUSED, TG_L2]
Ticket: "BUKI-1252"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/UrlLen2>"
Description: "The length of the URL, accurate to the character. It is not used in production."
Authors: "kartynnik"
Responsibles: "kartynnik"
}
Factor {
Index: 582
CppName: "FI_IS_HUB"
Name: "IsHub"
Ticket: "BUKI-1257"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsHub>"
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Is it a hub page? (Pillar page?)"
Authors: "suncpp"
Responsibles: "alsafr"
}
Factor {
Index: 583
CppName: "FI_STATIC_TITLE_COMM"
Name: "StaticTitleComm"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/StaticTitleComm>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "The degree of commercialization of the page's header. Not used (deprecated)."
Authors: "zosimov"
Responsibles: "zosimov"
}
Factor {
Index: 584
CppName: "FI_STATIC_TITLE_BM25_EX"
Name: "StaticTitleBM25Ex"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/StaticTitleBM25Ex>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "BM25 score of a page's header based on its text."
Authors: "zosimov"
Responsibles: "zosimov"
}
Factor {
Index: 585
CppName: "FI_STATIC_TITLE_LR_BM25"
Name: "StaticTitleLRBM25"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/StaticTitleLRBM25>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: "BM25 of page header based on texts of incoming links."
Authors: "zosimov"
Responsibles: "zosimov"
}
Factor {
Index: 586
CppName: "FI_SEO_IN_PAY_LINKS"
Name: "SeoInPayLinks"
Ticket: "BUKI-1243"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SeoInPayLinks>"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "The number of incoming bad links between hosts."
Authors: "suncpp"
Responsibles: "alsafr"
}
Factor {
Index: 587
CppName: "FI_US_LONG_PERIOD_URL_MOBILE_DT180_AVG"
Name: "USLongPeriodUrlMobileDt180Avg"
Ticket: ["FACTOR-1129"]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_CLICK_MACHINE]
Description: "Static URL factor based on 1600 days of search sessions calculated from mobile sessions, with average DwellTime, where the DwellTime from a session is cut if it is over 180 seconds."
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors>"
Authors: ["edik"]
Responsibles: ["edik", "tarum", "niknik"]
}
Factor {
Index: 588
CppName: "FI_US_LONG_PERIOD_URL_MOBILE_LONG_CLICK_PROB"
Name: "USLongPeriodUrlMobileLongClickProb"
Ticket: ["FACTOR-1129"]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_CLICK_MACHINE]
Description: "Static URL factor based on 1600 days of search sessions calculated from mobile sessions. Probability that a click on the URL will last over 120 seconds."
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors>"
Authors: ["edik"]
Responsibles: ["edik", "tarum", "niknik"]
}
Factor {
Index: 589
CppName: "FI_US_LONG_PERIOD_URL_MOBILE_LOSSES_PROB"
Name: "USLongPeriodUrlMobileLossesProb"
Ticket: ["FACTOR-1129"]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICK_MACHINE]
Description: "Static URL factor calculated from search sessions over 1600 days based on mobile sessions. Probability that the URL will not be clicked if at least one lower URL is clicked."
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors>"
Authors: ["edik"]
Responsibles: ["edik", "tarum", "niknik"]
}
Factor {
Index: 590
CppName: "FI_US_LONG_PERIOD_URL_MOBILE_DT3600_AVG_REG"
Name: "USLongPeriodUrlMobileDt3600AvgReg"
Ticket: ["FACTOR-1129"]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_CLICK_MACHINE]
Countries: CNT_RELEV
Description: "Static URL factor based on search sessions over 1600 days calculated using mobile sessions. Average DwellTime, with DwellTime cut off from the session if it's over 3600 seconds. Localization down to country level."
Group: "RegDocStatic"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors>"
Authors: ["edik"]
Responsibles: ["edik", "tarum", "niknik"]
}
Factor {
Index: 591
CppName: "FI_US_LONG_PERIOD_URL_MOBILE_DT180_AVG_REG"
Name: "USLongPeriodUrlMobileDt180AvgReg"
Ticket: ["FACTOR-1129"]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_CLICK_MACHINE]
Countries: CNT_RELEV
Description: "Static URL factor calculated for 1600 days of search sessions based on mobile sessions. Average DwellTime, with DwellTime from the session being cut if more than 180 seconds. Localization to the country level."
Group: "RegDocStatic"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors>"
Authors: ["edik"]
Responsibles: ["edik", "tarum", "niknik"]
}
Factor {
Index: 592
CppName: "FI_HP_DETECTOR_PREDICT"
Name: "HpDetectorPredict"
Ticket: "COMMERCIAL-45"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: "The value of the health detector, calculated in Hippo (algorithm name)."
MinValue: -10
MaxValue: 10
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
ImplementationTime: "2020-09-25"
}
Factor {
Index: 593
CppName: "FI_IS_FEED_LISTING"
Name: "IsFeedListing"
Ticket: "SEARCHSPAM-15486"
Authors: ["bikulov"]
Responsibles: ["bikulov", "ulyanov"]
Description: "OffersBase feature for ecoboost."
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 594
CppName: "FI_IS_FEED_MAIN"
Name: "IsFeedMain"
Ticket: "SEARCHSPAM-15486"
Authors: ["bikulov"]
Responsibles: ["bikulov", "ulyanov"]
Description: "OffersBase feature for ecoboost."
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 595
CppName: "FI_IS_FEED_STRATOCASTER"
Name: "IsFeedStratocaster"
Ticket: "SEARCHSPAM-15486"
Authors: ["bikulov"]
Responsibles: ["bikulov", "ulyanov"]
Description: "OffersBase feature for ecoboost."
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 596
CppName: "FI_IS_FEED_ANY"
Name: "IsFeedAny"
Ticket: "SEARCHSPAM-15486"
Authors: ["bikulov"]
Responsibles: ["bikulov", "ulyanov"]
Description: "OffersBase feature for ecoboost."
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 597
CppName: "FI_TITLE_IN_LINKS_TRIGRAMS"
Name: "TitleInLinksTrigrams"
Ticket: "BUKI-1264"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/titleinlinkstrigrams>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "The ratio of unique trigrams in the title to the trigrams in the links."
Authors: "morph"
Responsibles: "morph"
}
Factor {
Index: 598
CppName: "FI_LINKS_IN_TITLE_TRIGRAMS"
Name: "LinksInTitleTrigrams"
Ticket: "BUKI-1264"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/titleinlinkstrigrams>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: "The percentage of unique trigrams in the link compared to the trigrams in the title."
Authors: "morph"
Responsibles: "morph"
}
Factor {
Index: 599
CppName: "FI_TRASH_ADV"
Name: "TrashAdv"
Ticket: "SEARCH-254"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/Antispam/AntiTrash/adv/TrashAdvFactor>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The number of advertisements on a page."
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 600
CppName: "FI_METRIKA_URL_VISITS"
Name: "MetrikaUrlVisits"
Ticket: ["BUKI-1148", "BUKI-1274"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlVisits>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: "Similar to YabarUrlVisits"
Authors: "smikler"
Responsibles: ["smikler", "tarum", "niknik"]
}
Factor {
Index: 601
CppName: "FI_URLGEO_ADMS"
Name: "UrlGeoAdms"
Ticket: "QREG-23"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/geo/RegNavQueries>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_URL_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "The URL document is the same as the user's region (or state). ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/geo/RegNavQueries> /JandeksPoisk/KachestvoPoiska/geo/RegNavQueries))"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 602
CppName: "FI_URLGEO_CITY"
Name: "UrlGeoCity"
Ticket: "QREG-23"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/geo/RegNavQueries>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNUSED]
Description: "The URL document is the same as the user's city."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 603
CppName: "FI_REG_NAV_QUERY"
Name: "RegNavQuery"
DependsOn: [{Feature: ["RegNavQuery"], Slice: "begemot_query_factors"}]
Ticket: "QREG-23"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/geo/RegNavQueries>"
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "Regional-navigational query - there is one or more navigational results for it in the user's region."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 604
CppName: "FI_YABAR_URL_LCAC"
Name: "YabarUrlLcAc"
Ticket: "BUKI-1295"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YabarUrlLcAc>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The number of sessions in which the URL was the last one, as a ratio to the number of sessions in which the URL appeared."
Authors: "snailer"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 605
CppName: "FI_SOWNER_MAX_SUM_SOURCE_RANK"
Name: "SOMaxSumSourceRank"
Ticket: "BUKI-1214"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SOMaxSumSourceRank>"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_USER, TG_BROWSER, TG_COUNTER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_TRANS, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: "The sum of the maximum values of SourceRank for each incoming link including the uniqueness of the owner."
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 606
CppName: "FI_DBM35"
Name: "DBM35"
Ticket: "BUKI-1303"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/DBM35>"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Description: "BM25 applied to texts and links with special weights based on the level of matching (form, lemma, synonym)."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 607
CppName: "FI_TRLR_QUORUM_FM"
Name: "TRLRQuorumFm"
Ticket: "BUKI-1303"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/DBM35>"
Group: "TextAndLinkBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_LINK_TEXT, TG_DEPRECATED]
Description: "The weight of the query words mentioned in the text in exact form."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 608
CppName: "FI_TRLR_QUORUM_LEMMA"
Name: "TRLRQuorumLemma"
Ticket: "BUKI-1303"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/DBM35>"
Group: "TextAndLinkBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: "The weight of the query words mentioned in the text with accuracy up to the lemma."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 609
CppName: "FI_TRLR_QUORUM_SYN"
Name: "TRLRQuorumSyn"
Ticket: "BUKI-1303"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/DBM35>"
Group: "TextAndLinkBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: "The weight of the query words mentioned in the text."
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 610
CppName: "FI_QUERY_ISHUM"
Name: "IsHum"
DependsOn: [{Feature: ["IsHum"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1316"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsHum>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The weight of the maximum encountered category Hum or Hum1 object in the query is reduced to basic searches under the name 'ishum'. (For more information, see ((<http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects> som's markup))). ((<http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#ishum>))"
Authors: "arseny"
Responsibles: "arseny"
}
Factor {
Index: 611
CppName: "FI_QUERY_ISTEXT"
Name: "IsText"
DependsOn: [{Feature: ["IsText"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1316"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsText>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "It reduces the maximum weight of the encountered object of category Text or Text1 in the query to the basic search under the name 'istext'. (For more information, see ((<http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects> som's markup))). ((<http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#istext>))"
Authors: "arseny"
Responsibles: "arseny"
}
Factor {
Index: 612
CppName: "FI_QUERY_ISPICTURE"
Name: "IsPicture"
DependsOn: [{Feature: ["IsPicture"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1316"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsPicture>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "It reduces the maximum weight of the encountered object of category Picture or Picture1 in the query to the basic search under the name 'ispicture'. (For more information, see ((<http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects> som's markup))). ((<http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#ispicture>))"
Authors: "arseny"
Responsibles: "arseny"
}
Factor {
Index: 613
CppName: "FI_QUERY_MAXONE"
Name: "MaxOne"
DependsOn: [{Feature: ["MaxOne"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1316"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MaxOne>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "It returns the maximum level of nominality of encountered objects in the query under the name 'wmaxone'. (For more information, see ((<http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects> som's markup))). ((<http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#maxone>))"
Authors: "arseny"
Responsibles: "arseny"
}
Factor {
Index: 614
CppName: "FI_QUERY_MINONE"
Name: "MinOne"
DependsOn: [{Feature: ["MinOne"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1316"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MinOne>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "It returns the minimum degree of nominality of encountered objects in the query under the name 'wminone'. (For more information, see ((<http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects> som's markup))). ((<http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#minone> More details))"
Authors: "arseny"
Responsibles: "arseny"
}
Factor {
Index: 615
CppName: "FI_OQ_BM25_STR"
Name: "OqBm25Str"
Ticket: ["BUKI-1185", "BUKI-1270", "BUKI-1311", "BETATEST-2194"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBm25Str>"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "Bm25 based on query index for domAttr"
Authors: ["agorodilov", "vvp"]
Responsibles: ["agorodilov", "alsafr"]
}
Factor {
Index: 616
CppName: "FI_OQ_BM25_LEM"
Name: "OqBm25Lem"
Ticket: ["BUKI-1185", "BUKI-1270", "BUKI-1311", "BETATEST-2194"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBm25Lem>"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "Bm25 based on query index for domAttr"
Authors: ["agorodilov", "vvp"]
Responsibles: ["agorodilov", "alsafr"]
}
Factor {
Index: 617
CppName: "FI_OQ_BM25_SYN"
Name: "OqBm25Syn"
Ticket: ["BUKI-1185", "BUKI-1270", "BUKI-1311", "BETATEST-2194"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBm25Syn>"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "Bm25 based on query index for domAttr"
Authors: ["agorodilov", "vvp"]
Responsibles: ["agorodilov", "alsafr"]
}
Factor {
Index: 618
CppName: "FI_OQ_BCLM_WEIGHTED"
Name: "OqBclmWeighted"
Ticket: ["BUKI-1185", "BUKI-1270", "BUKI-1311", "BETATEST-2194"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBclmWeighted>"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "BCLM based on query index for domAttr"
Authors: ["agorodilov", "vvp"]
Responsibles: ["agorodilov", "alsafr"]
}
Factor {
Index: 619
CppName: "FI_OQ_BCLM_PLAIN"
Name: "OqBclmPlain"
Ticket: ["BUKI-1185", "BUKI-1270", "BUKI-1311", "BETATEST-2194"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBclmPlain>"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: "BCLM based on query index for owners"
Authors: ["agorodilov", "vvp"]
Responsibles: ["agorodilov", "alsafr"]
}
Factor {
Index: 620
CppName: "FI_LINKS_ALIVE"
Name: "LinksAlive"
Ticket: "BUKI-1130"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LinksAlive>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_LINK_GRAPH, TG_TRANS, TG_UNUSED, TG_OFTEN_ZERO, TG_L2]
Description: "Allows you to evaluate whether the document is 'live' (active) in terms of incoming links to it."
Authors: ["egoist", "vvp"]
Responsibles: ["egoist", "alsafr"]
}
Factor {
Index: 621
CppName: "FI_SMALL_WINDOW"
Name: "SmallWindow"
Ticket: "BUKI-1311"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SmallWindow>"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED, TG_REARR_USE]
Description: "The maximum sum of the weights of query words within a window of 50 words"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 622
CppName: "FI_METRIKA_URL_VISITORS"
Name: "MetrikaUrlVisitors"
Ticket: "BUKI-1148"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlVisitors>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: "Similar to YabarUrlVisitors"
Authors: "smikler"
Responsibles: ["smikler", "tarum", "niknik"]
}
Factor {
Index: 623
CppName: "FI_METRIKA_URL_AVG_TIME"
Name: "MetrikaUrlAvgTime"
Ticket: "BUKI-1148"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlAvgTime>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_REARR_USE, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: "Similar to YabarUrlAvgTime"
Authors: "smikler"
Responsibles: ["smikler", "tarum", "niknik"]
}
Factor {
Index: 624
CppName: "FI_METRIKA_URL_CORE_AUDIENCE"
Name: "MetrikaUrlCoreAudience"
Ticket: "BUKI-1268"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlCoreAudience>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_DEPRECATED, TG_UNUSED]
Description: "The core audience of pages with the Yandex Metrica counter"
Authors: "smikler"
Responsibles: "smikler"
}
Factor {
Index: 625
CppName: "FI_REGEX_MAX_CLICK_PERCENT"
Name: "RegexMaxClickPercent"
Ticket: "BUKI-1300"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent>"
Group: "Regex"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Description: "The ratio of clicks on this URL to all clicks on similar queries"
Authors: "finder"
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 626
CppName: "FI_REGEX_CTR"
Name: "RegexCtr"
Ticket: "BUKI-1300"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexctr>"
Group: "Regex"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Description: "Corrected CTR of this url for all related queries"
Authors: "finder"
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 627
CppName: "FI_DOM_PHRASE_CLICK_RANK_BI"
Name: "DomPhraseClickRankBi"
Ticket: "BUKI-1278"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat>"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: "Domain click-through rate by bigrams (excluding thesaurus query extensions)"
Authors: ["finder", "kartynnik"]
Responsibles: ["kartynnik","akhropov"]
}
Factor {
Index: 628
CppName: "FI_DOM_PHRASE_YABAR_BI"
Name: "DomPhraseYabarBi"
Ticket: "BUKI-1278"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat>"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: "Traffic to the site from search engines by bigrams, according to Bar (excluding thesaurus query extensions)"
Authors: ["finder", "kartynnik"]
Responsibles: ["kartynnik","akhropov"]
}
Factor {
Index: 629
CppName: "FI_LAST_WORD_HOST_CLICKS"
Name: "LastWordHostClicks"
Ticket: "BUKI-1278"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat>"
Group: "Domain"
Tags: [TG_DYNAMIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_UNDOCUMENTED, TG_OFTEN_ZERO]
Description: "Clickability of the host for the last query word (excluding thesaurus query extensions)"
Authors: ["finder", "kartynnik"]
Responsibles: ["kartynnik","akhropov"]
}
Factor {
Index: 630
CppName: "FI_HOST_HAS_FEED_URLS"
Name: "HostHasFeedUrls"
Ticket: "SEARCHSPAM-15486"
Authors: ["bikulov"]
Responsibles: ["bikulov", "ulyanov"]
Description: "OffersBase feature for ecoboost."
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 631
CppName: "FI_IS_FEED_OFFER"
Name: "IsFeedOffer"
Ticket: "SEARCHSPAM-15486"
Authors: ["bikulov"]
Responsibles: ["bikulov", "ulyanov"]
Description: "OffersBase feature for ecoboost."
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 632
CppName: "FI_HOST_ECOM_KERNEL_1"
Name: "HostEcomKernel1"
Ticket: "SEARCHSPAM-15417"
Authors: ["ngoltsova", "sdormidontov"]
Responsibles: ["bikulov", "ngoltsova", "sdormidontov"]
Description: "Business kernel."
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 633
CppName: "FI_HOST_ECOM_KERNEL_2"
Name: "HostEcomKernel2"
Ticket: "SEARCHSPAM-15417"
Authors: ["ngoltsova", "sdormidontov"]
Responsibles: ["bikulov", "ngoltsova", "sdormidontov"]
Description: "Business kernel."
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV],
ImplementationTime: "2020-09-24"
}
Factor {
Index: 634
CppName: "FI_HOST_ECOM_KERNEL_3"
Name: "HostEcomKernel3"
Ticket: "SEARCHSPAM-15417"
Authors: ["ngoltsova", "sdormidontov"]
Responsibles: ["bikulov", "ngoltsova", "sdormidontov"]
Description: "Business kernel."
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 635
CppName: "FI_RC_SEARCH_BASE_URL_RATIONAL_SIGMOID_D1TM600_AT_REQ"
Name: "RcSearchBaseUrlRationalSigmoidD1TM600AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: "URL feature computed at the request time from rapid clicks search counters with decay of 1 day"
Ticket: "USERFEAT-1503"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-10-04"
}
Factor {
Index: 636
CppName: "FI_SYNSET_LOCM"
Name: "SynSetLocm"
Ticket: "SEARCH-218"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SynSetLocm>"
Group: "SynSetLocm"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LINK_TEXT, TG_DEPRECATED]
Description: "Copy of the ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Locm> LOCM)) factor for ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Synset> synsets))."
Authors: "alexeykruglov"
Responsibles: "alexeykruglov"
}
Factor {
Index: 637
CppName: "FI_SYNSET_LINK_BM25"
Name: "SynSetLinkBM25"
Ticket: "SEARCH-218"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SynSetLinkBM25>"
Group: "Dynamic"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LINK_TEXT, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: "Copy of the LinkBM25 factor for ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Synset> synsets))."
Authors: "alexeykruglov"
Responsibles: "alexeykruglov"
}
Factor {
Index: 638
CppName: "FI_RC_SEARCH_BASE_URL_CONTRAST_D30ODD0_9_X_D30T1_AT_REQ"
Name: "RcSearchBaseUrlContrastD30Odd0_9_X_D30T1AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: "URL feature computed at the request time from rapid clicks search counters with decay of 30 days"
Ticket: "USERFEAT-1503"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-10-04"
}
Factor {
Index: 639
CppName: "FI_REMOVED_639"
Name: "Removed_639"
Tags: [TG_REMOVED]
}
Factor {
Index: 640
CppName: "FI_DMOZ_QUERY_BEST_THEME"
Name: "DmozQueryBestTheme"
DependsOn: [{Feature: ["DmozQueryBestTheme"], Slice: "begemot_query_factors"}]
Ticket: "FOREIGN-221"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DmozQueryBestTheme>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The query’s topic with the highest probability, determined by ((<http://wiki.yandex-team.ru/JandeksPoisk/ZarubezhnyjjInternet/DMOZqueryClassifier1> the DMOZTheme wizard's rule)); only the most popular topics are considered (but there are more of them than in the DmozQueryThemes factor). The factor contains the probability that the query matches the topic, but each topic is assigned its own interval within the segment [0..1]"
Authors: "lamo"
Responsibles: "lamo"
}
Factor {
Index: 641
CppName: "FI_DMOZ_QUERY_THEMES"
Name: "DmozQueryThemes"
DependsOn: [{Feature: ["DmozQueryThemes"], Slice: "begemot_query_factors"}]
Ticket: "FOREIGN-221"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DmozQueryThemes>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The query topic determined by ((<http://wiki.yandex-team.ru/JandeksPoisk/ZarubezhnyjjInternet/DMOZqueryClassifier1> the DMOZTheme wizard's rule)); only a few of the most popular topics are considered."
Authors: "lamo"
Responsibles: "lamo"
}
Factor {
Index: 642
CppName: "FI_DIVERSITY_CATEG_NEED_PHOTO"
Name: "DiversityCategNeedPhoto"
DependsOn: [{Feature: ["DiversityCategNeedPhoto"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1213"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "0 or 1 depending on whether the query has an explicit need_photo intent from the diversity categories"
Authors: "stasd07"
Responsibles: "stasd07"
}
Factor {
Index: 643
CppName: "FI_DIVERSITY_CATEG_NEED_MAP"
Name: "DiversityCategNeedMap"
DependsOn: [{Feature: ["DiversityCategNeedMap"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1213"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "0 or 1 depending on whether the query has an explicit need_map intent from the diversity categories"
Authors: "stasd07"
Responsibles: "stasd07"
}
Factor {
Index: 644
CppName: "FI_LONG_QUERY_SYN"
Name: "LongQuerySyn"
DependsOn: [{Feature: ["LongQuerySyn"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1361"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LongQuerySyn>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_DEPRECATED]
Description: "Factor is similar to LongQuery (sum of idf of query words), but with 'correct' consideration of synonyms. Specifically, the minimum idf among the synonyms (that is, the idf of the most frequent one) is used."
Authors: "morph"
Responsibles: "morph"
}
Factor {
Index: 645
CppName: "FI_URL_HAS_SHORT_COUNTRY_NAME_TOKEN"
Name: "UrlHasShortCountryNameToken"
Ticket: "FACTOR-2431"
Tags: [TG_DYNAMIC, TG_URL_TEXT, TG_LOCALIZED_COUNTRY, TG_L2, TG_BINARY, TG_NN_OVER_FEATURES_USE]
Description: "The URL contains a token that matches the short name of the user's country. The factor is calculated only on the EU stream."
Authors: "filmih"
Responsibles: "filmih"
ImplementationTime: "2020-09-24"
}
Factor {
Index: 646
CppName: "FI_TURKEY_PAGE_RANK"
Name: "TurkeyPageRank"
Ticket: "FOREIGN-225"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/TurkeyPageRank>"
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_LOCALIZED_COUNTRY, TG_UNDOCUMENTED, TG_UNUSED, TG_OFTEN_ZERO]
Countries: CNT_TR
Description: "Personalized Turkish PageRank"
Authors: "lamo"
Responsibles: "lamo"
}
Factor {
Index: 647
CppName: "FI_EXPECTED_FOUND"
Name: "ExpectedFound"
Ticket: "FOREIGN-225"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ExpectedFound>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Expected number of results for the query"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 648
CppName: "FI_FOOTER_IN_LINKS_TRIGRAMS"
Name: "FooterInLinksTrigrams"
Ticket: "BUKI-1341"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/FooterInLinksTrigrams>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "Percentage of unique footer snippet trigrams in link trigrams"
Authors: "morph"
Responsibles: "morph"
}
Factor {
Index: 649
CppName: "FI_LINKS_IN_FOOTER_TRIGRAMS"
Name: "LinksInFooterTrigrams"
Ticket: "BUKI-1341"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/FooterInLinksTrigrams>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "Percentage of unique link trigrams in footer snippet trigrams"
Authors: "morph"
Responsibles: "morph"
}
Factor {
Index: 650
CppName: "FI_ERRATUM_LOG_QUERY_PROBABILITY"
Name: "ErratumLogQueryProbability"
DependsOn: [{Feature: ["ErratumLogQueryProbability"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1388"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ErratumLogQueryProbability>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_BROWSER, TG_COUNTER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The binary logarithm of the probability of the query based on the language model of the erratum typo service"
Authors: "snow"
Responsibles: ["snow", "khristich"]
}
Factor {
Index: 651
CppName: "FI_URL_IS_MARKET_OFFER"
Name: "UrlIsMarketOffer"
Ticket: "COMMERCIAL-41"
Description: "Url is an offer in the latest version of the market database."
Tags: [TG_DOC, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED]
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
ImplementationTime: "2020-09-27"
}
Factor {
Index: 652
CppName: "FI_DBM40"
Name: "DBM40"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Variation on the theme of ((<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DBM25> DBM25)); see ysite/yandex/relevance/dbm25.cpp"
Authors: "denplusplus"
Responsibles: "alsafr"
}
# TODO(FACTORDEL-97): replace with TG_REMOVED, TG_REUSABLE and remove old formulas
Factor {
Index: 653
CppName: "FI_REMOVED_653"
Name: "Removed_653"
Tags: [TG_UNUSED]
}
Factor {
Index: 654
CppName: "FI_BM25_0"
Name: "BM25_0"
Ticket: "FOREIGN-225"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ExpectedFound>"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Variation of BM25"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 655
CppName: "FI_BM25_1"
Name: "BM25_1"
Ticket: "FOREIGN-225"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ExpectedFound>"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Variation of BM25"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 656
CppName: "FI_BM25_0123"
Name: "BM25_0123"
Ticket: "FOREIGN-225"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ExpectedFound>"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Variation of BM25"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 657
CppName: "FI_QUERY_URL_CORRECTED_CTR"
Name: "QueryUrlCorrectedCtr"
Ticket: "BUKI-1291"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QueryUrlCorrectedCtr>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1832D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "'Fixed' clicks counted with RequestAggregateLib"
Authors: "kcd"
Responsibles: ["smikler", "tarum", "niknik"]
}
Factor {
Index: 658
CppName: "FI_QUERY_URL_CORRECTED_CTR_REG"
Name: "QueryUrlCorrectedCtr_Reg"
Ticket: "BUKI-1291"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QueryUrlCorrectedCtr>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1832D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "'Fixed' clicks counted with RequestAggregateLib. Regional version"
Authors: "kcd"
Responsibles: ["smikler", "tarum", "niknik"]
}
Factor {
Index: 659
CppName: "FI_YABAR_URL_VISITS_REG"
Name: "YabarUrlVisits_Reg"
Ticket: "BUKI-1180"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors>"
Group: "RegDocStatic"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Countries: CNT_RELEV
Description: "Regional url traffic based on Yandex bar"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 660
CppName: "FI_METRIKA_URL_HOST_VISIT_TIME"
Name: "MetrikaUrlHostVisitTime"
Ticket: ["BUKI-1272", "BUKI-1312"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlHostVisitTime>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: "The average time a user spends on a host accessed externally (from another non-search site) from a specific URL"
Authors: ["gosu", "smikler"]
Responsibles: ["smikler", "tarum", "niknik"]
}
Factor {
Index: 661
CppName: "FI_METRIKA_URL_HOST_VISIT_DEPTH"
Name: "MetrikaUrlHostVisitDepth"
Ticket: ["BUKI-1271", "BUKI-1312"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlHostVisitDepth>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: "Average 'depth' (number of hits within the host) of a user's visit of the host accessed externally (from another non-search site) from a particular URL"
Authors: ["gosu", "smikler"]
Responsibles: ["smikler", "tarum", "niknik"]
}
Factor {
Index: 662
CppName: "FI_DBM_NUMBERS"
Name: "DBMNumbers"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "DBM separately based on numbers"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 663
CppName: "FI_DBM_GEO"
Name: "DBMGeo"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "DBM separately based on query geo-objects"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 664
CppName: "FI_DBM_SUBSTANTIVE"
Name: "DBMSubstantive"
Group: "DBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "DBM separately based on nouns"
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 665
CppName: "FI_AVG_SESSION_LEN"
Name: "AvgSessionLen"
DependsOn: [{Feature: ["AvgSessionLen"], Slice: "begemot_query_factors"}]
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Description: "The average length of the logical session from the query"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/AvgSessionLen>"
Authors: "denplusplus"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 666
CppName: "FI_NHOP_TEXT_BCLM_WEIGHTED"
Name: "NHopTextBclmWeighted"
Group: "Annotation"
Ticket: "FACTOR-108"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopText>"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_LOCALIZED_COUNTRY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_238D, TG_USERFEAT_NHOP]
Countries: CNT_RELEV
Description: "Bclm (weighted) based on texts from hops."
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 667
CppName: "FI_YABAR_URL_DOWNLOADS"
Name: "YabarUrlDownloads"
Ticket: "SEARCHSPAM-3039"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YabarUrlDownloads>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: "The probability of something being downloaded from a document"
Authors: "ulyanov"
Responsibles: ["ulyanov", "tarum", "niknik"]
}
Factor {
Index: 668
CppName: "FI_BOCM"
Name: "Bocm"
Ticket: "BUKI-1495"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Bocm>"
Group: "Bocm"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Evaluates word positions in document sentences in accordance with word positions in a query."
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 669
CppName: "FI_HOST_USER_LEAKAGE"
Name: "HostUserLeakage"
Ticket: "COMMERCIAL-55"
Tags: [TG_OWNER, TG_STATIC, TG_L2, TG_NOT_01, TG_DATA_FROM_SAASKV, TG_UNUSED]
Description: "Bounce rate from the search after visiting the site"
Authors: "alejes"
Responsibles: "alejes"
MaxValue: 1.0
MinValue: -1.0
ImplementationTime: "2020-08-27"
}
Factor {
Index: 670
CppName: "FI_FIO_MATCH"
Name: "FioMatch"
Ticket: "FACTEX-2467"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov/FioMatchFactor>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNUSED]
Description: "The document contains the full name from the query."
Authors: "udovichenko-r"
Responsibles: "udovichenko-r"
}
Factor {
Index: 671
CppName: "FI_IS_INDEX_PAGE"
Name: "IsIndexPage"
Ticket: "FORMULATOR-185"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage>"
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "This is index.(html/php/aspx?/...), without cgi parameters. It’s calculated based on all duplicates."
Authors: "smikler"
Responsibles: "smikler"
}
Factor {
Index: 672
CppName: "FI_IS_INDEX_PAGE_SOFT"
Name: "IsIndexPageSoft"
Ticket: "FORMULATOR-185"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage>"
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "It's index.(html/php/aspx?/...), possibly with cgi parameters. It’s calculated based on all duplicates."
Authors: "smikler"
Responsibles: "smikler"
}
Factor {
Index: 673
CppName: "FI_IS_OWNER"
Name: "IsOwner"
Ticket: "FORMULATOR-185"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage>"
Tags: [TG_HOST, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Whether the host is its own owner, roughly speaking Host == Owner(Host)."
Authors: "smikler"
Responsibles: "smikler"
}
Factor {
Index: 674
CppName: "FI_MIN_PATH_LEN"
Name: "MinPathLen"
Ticket: "FORMULATOR-185"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage>"
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The minimum length of PathAndQuery across all near-duplicates."
Authors: "smikler"
Responsibles: "smikler"
}
Factor {
Index: 675
CppName: "FI_LERF_GEO_LR_LOG_RELEV_CNT"
Name: "XLerfGeoLRlogRelevCnt"
Ticket: "BUKI-1433"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/XLerfGeoLRlogRelevCnt>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Regional (only links from the country of the query are considered) version of the XLerfGeoLRlogRelev factor"
Authors: "mdvornikov"
Responsibles: "mdvornikov"
}
Factor {
Index: 676
CppName: "FI_NON_COMM_LERF_NORM_LR_LOG_RELEV_CNT"
Name: "XNonCommLerfNormLRlogRelevCnt"
Ticket: "BUKI-1433"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/XNonCommLerfNormLRlogRelevCnt>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Regional (only links from the country of the query are considered) version of the XNonCommLerfNormLRlogRelev factor"
Authors: "mdvornikov"
Responsibles: "mdvornikov"
}
Factor {
Index: 677
CppName: "FI_LOCM_CNT"
Name: "LocmCnt"
Ticket: "BUKI-1433"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LocmCnt>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Regional (only links from the country of the query are considered) version of the Locm factor"
Authors: "mdvornikov"
Responsibles: "mdvornikov"
}
Factor {
Index: 678
CppName: "FI_LR_RELEV_CNT"
Name: "XLRrelevCnt"
Ticket: "BUKI-1433"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/XLRrelevCnt>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Regional (only links from the country of the query are considered) version of the XLRrelev factor"
Authors: "mdvornikov"
Responsibles: "mdvornikov"
}
Factor {
Index: 679
CppName: "FI_LERF_LR_RELEV_200_CNT"
Name: "XLerfLRrelev200Cnt"
Ticket: "BUKI-1433"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/XLerfLRrelev200Cnt>"
Group: "Xref"
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Regional (only links from the country of the query are considered) version of the XLerfLRrelev200 factor"
Authors: "mdvornikov"
Responsibles: "mdvornikov"
}
Factor {
Index: 680
CppName: "FI_NAV_LINEAR"
Name: "NavLinear"
Ticket: ["COMBPROLAB-107", "SEARCHSPAM-3340"]
Wiki: "<http://wiki.yandex-team.ru/MaratXabibraxmanov/seminavigationqueries>"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_NAV, TG_TRANS, TG_REARR_USE, TG_DEPRECATED]
Description: "((<http://wiki.yandex-team.ru/JandeksPoisk/Antispam/polunavigacionnyezaprosy#faktornavigacionnostiparyurl-zapros> Classifier)) of vital [query-url] pairs; the url is vital for the query if the classifier's value is > 0.5"
Authors: ["burangulov", "kustarev"]
Responsibles: "burangulov"
DependsOn: [{Feature: ["PR", "LR", "PrBonus", "TRp2", "LRp2", "Shop", "YaBar", "Long", "LongQuery", "SR", "LRHitNum100", "PctLinks", "LinkQuality", "AddTime", "TLBM25", "Adv", "YandexAdv", "TxtPair", "TxtHead", "HasNoQueryShows", "LogLR", "TxtPairEx", "TxtBreakEx", "TxtHeadEx", "TxtPairSy", "TxtBreakSy", "TxtHeadSy", "TxtHiRelSy", "QueryDOwnerClicksPCTR", "HasNoQueryDOwnerShows", "OwnerClicksPCTR", "XLRp2", "XLRgood", "XLRmaxDpr", "NewLinkQuality", "TextFeatures", "TextLike", "SpamKarma", "DocLen", "UrlLen", "HostSize", "LinkSpeed", "XLerfLRlogRelev", "GeoCityProxim", "LinksWithWordsPercent", "LinksWithAllWordsPercent", "IsComm", "GeoRegionProxim", "TxtSkipPair", "QDiversity", "XGeoLRlogRelev", "XLerfGeoLRlogRelev", "XNonCommNormLRlogRelev", "Nevasca2", "LinkAge", "XLerfLangLRlogRelev", "QueryDOwnerClicksFRC", "QueryDOwnerClicksPCTR_Reg", "QueryURLClicksFRC_Reg", "QueryDOwnerClicksFRC_Reg", "QueryDOwnerClicksCombo_Reg", "XLRCatalogRelev", "TLp1All", "BFlemmaAll", "PassageLegacyTR", "TxtBM25AttenSyn", "MaxWordHostRank", "MaxWordHostClicks", "DomPhraseClickRank", "EshopValue", "CountersSearchTraffic1", "CountersSearchTraffic2", "DomPhraseYabar", "GeoRelevRegionCountry", "XLRGeoRelevRegionCountry", "GeoCountryProxim", "MaxWordHostYaBar", "FirstWordHostClicks", "QueryDOwnerYabarVisits", "QueryDOwnerYabarVisitors", "QueryDOwnerYabarAvgTime", "PageRegionSizeIn", "PageRegionInvSizeIn", "GeoGeometryProxim", "RingsHostRankBadnessOld", "YabarHostVisitors", "YabarHostSearchTraffic", "YabarHostInternalTraffic", "YabarHostAvgTime", "YabarHostAvgTime2", "YabarHostAvgActions", "YabarUrlVisits", "YabarUrlVisitors", "YabarUrlAvgTime", "OwnerSatisfied4Rate", "TitleIdfSum_broken", "HeadingIdfSum_broken", "CommLinksSEOHosts", "CommLinksSEOHostsNonComm", "Diversity2", "MorningQuery", "LCor", "SubqueryThMatchA", "OwnerSDiffClickEntropy", "OwnerSDiffShowEntropy", "OwnerSDiffCSRatioEntropy", "UrlDomainFraction", "UrlPathAndParamsFraction", "LnkBreak", "LnkPairSy", "LnkBrkSy", 
"OwnerClicksPCTR_Reg", "OwnerSDiffClickEntropy_Reg", "OwnerSDiffShowEntropy_Reg", "OwnerSDiffCSRatioEntropy_Reg", "IsCom", "IsNotRu", "LargestSyInexactGroup", "SynFLremap1", "SynFLremap2", "OwnerSessNormDuration", "UrlSessNormDurRate", "QueryDOwnerWeightClick", "QueryDOwnerOnlyClickRate", "QueryDOwnerClickSummary", "QueryDOwnerSatisfied4Rate", "SyntQuality", "PageDate", "RingsHostRankBadness3", "QSegmentsBM25", "QSegmentsWeight", "NumLatinLetters", "RingsHostRankBadness1", "TitleIdfSumFixed", "HeadingIdfSumFixed", "QueryDOwnerClicksCombo", "LRAmortizedByAge", "RusWordsInTitle", "MeanWordLength", "PercentWordsInLinks", "PercentVisibleContent", "PercentFreqWords", "PercentUsedFreqWords", "TrigramsProb", "TrigramsCondProb", "UrlBM25", "MatrixNet", "DaterAge", "CInDegree2", "TextMaxForms", "TextWeightedForms", "TextForms", "LinkWeightedForms", "QSegmentsBreaks", "ParticlesPortion", "AdjPronounsPortion", "AdvPronounsPortion", "FemAndMasNounsPortion", "LinkQualityFixed", "NewLinkQualityFixed", "IsOrg", "LongestText", "LRWithoutRare", "DifferentInternalLinks", "HasDeterminedCities", "UkrainPageRank", "QClassOAO", "PeriodicLinkDatesPercent", "QDOwnerStatPower", "QUrlStatPower", "OwnerReqsPopularity", "SecondIndegDistrXi", "Swbm25", "PositionLanguageModel", "TxtPair_W1", "AuraDocLogShared", "AuraDocLogAuthor", "AuraDocMeanSharedWeight", "RegHostRank", "LanguageCompliance", "CountryQDiversity", "CountryQDiversity2", "CountryQueryRegionality", "NumSlashes", "BM25FdPR_obsolete", "GskUrlModel", "UrlTrigrams", "YmwFull", "Bclm", "QueryCommercialityMx", "FieldLM", "GeoCityUrlRegionCountry", "TitleTrigramsQuery", "QueryWordSequencesTR", "OwnerNavQuota", "GeoRelevAlienCity", "HostReliability", "Mpsa", "PageRegionCoverage", "PageRegionSize", "PageRegionRelCoverage", "IsGeo", "CityQuery", "YmwFull2", "QueryWordCohesionTR", "QueryDOwnerWeightClick_Reg", "QueryDOwnerOnlyClickRate_Reg", "QueryDOwnerClickSummary_Reg", "QueryDOwnerSatisfied4Rate_Reg", "SegmentAuxAlphasInText", 
"SegmentAuxSpacesInText", "IsShop", "XLRGeoRelevRegionNatDomain", "QueryRefTrigramQuery", "QueryRefTrigramReferences", "IdfVariance", "UrlNGramsModel", "NumLinksFromSegmentContent", "Locm", "UrlQueryVariety_Reg", "UrlSessNormDurRate_Reg", "QueryDownerEnoughClicked", "BM25FdPRFixed", "QueryDOwnerWeightedSumFRCAndBM25FdPRFixed", "QueryDOwnerWeightedSumMaxWHRAndOnlyClickRate", "Tocm", "RelevGeoLinksPercent", "UrlLinkPercent", "NumNonLettersInUrl", "UrlLen2", "IsHub", "StaticTitleBM25Ex", "StaticTitleLRBM25", "SeoInPayLinks", "TitleInLinksTrigrams", "LinksInTitleTrigrams", "YabarUrlLcAc", "SOMaxSumSourceRank", "DBM35", "TRLRQuorumFm", "TRLRQuorumLemma", "IsHum", "MaxOne", "MinOne", "OqBm25Str", "OqBm25Lem", "OqBm25Syn", "OqBclmWeighted", "OqBclmPlain", "MetrikaUrlCoreAudience", "DomPhraseClickRankBi", "DomPhraseYabarBi", "LastWordHostClicks", "SynSetLocm", "DmozQueryBestTheme", "LongQuerySyn", "ExpectedFound"]}]
}
Factor {
Index: 681
CppName: "FI_RANK_COM_GOODNESS"
Name: "RankComGoodness"
Ticket: ["BUKI-1504", "SEARCHSPAM-3204"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RankComGoodness>"
Tags: [TG_COMMERCIAL, TG_OWNER, TG_STATIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_NN_OVER_FEATURES_USE]
Description: "Classifier based on commercial sites"
Authors: ["anelyubin", "sisoid"]
Responsibles: "efedina"
}
Factor {
Index: 682
CppName: "FI_HAS_DOWNLOAD_LINK_ON_FILE"
Name: "HasDownloadLinkOnFile"
Ticket: "ROBOT-2682"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HasDownloadLinkOnFile>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document has a direct link to the file"
Authors: "osenzen"
Responsibles: "osenzen"
}
Factor {
Index: 683
CppName: "FI_HAS_DOWNLOAD_LINK_ON_FILE_HOSTING"
Name: "HasDownloadLinkOnFileHosting"
Ticket: "ROBOT-2682"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HasDownloadLinkOnFile>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The document has a link to the file on the hosting"
Authors: "osenzen"
Responsibles: "osenzen"
}
Factor {
Index: 684
CppName: "FI_DIVERSITY_CATEG_DOWNLOAD"
Name: "DiversityCategDownload"
DependsOn: [{Feature: ["DiversityCategDownload"], Slice: "begemot_query_factors"}]
Ticket: "ROBOT-2688"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "0 or 1 - whether the query matches the regular expression from the ticket"
Authors: "stasd07"
Responsibles: "stasd07"
}
Factor {
Index: 685
CppName: "FI_DIVERSITY_CATEG_REVIEW"
Name: "DiversityCategReview"
DependsOn: [{Feature: ["DiversityCategReview"], Slice: "begemot_query_factors"}]
Ticket: "ROBOT-2688"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "0 or 1 - whether the query matches the regular expression from the ticket"
Authors: "stasd07"
Responsibles: "stasd07"
}
Factor {
Index: 686
CppName: "FI_DIVERSITY_CATEG_WATCH"
Name: "DiversityCategWatch"
DependsOn: [{Feature: ["DiversityCategWatch"], Slice: "begemot_query_factors"}]
Ticket: "ROBOT-2688"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "0 or 1 - whether the query matches the regular expression from the ticket"
Authors: "stasd07"
Responsibles: "stasd07"
}
Factor {
Index: 687
CppName: "FI_TUR_QR"
Name: "QrTur"
DependsOn: [{Feature: ["QrTur"], Slice: "begemot_query_factors"}]
Ticket: "QREG-27"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QrTur>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_DEPRECATED]
Description: "Prediction of the percentage of 'good' (with at least two different cities and frequency >= 10) mentions of the query with geography in Turkey"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 688
CppName: "FI_QUERY_TH3561"
Name: "QueryThEncyclopedic"
DependsOn: [{Feature: ["QueryThEncyclopedic"], Slice: "begemot_query_factors"}]
Ticket: "QREG-28"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Th3561>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The result of the lexical query classifier that predicts the probability of a click on a topic page 3561"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 689
CppName: "FI_QUERY_TH3973"
Name: "QueryThVideohosting"
DependsOn: [{Feature: ["QueryThVideohosting"], Slice: "begemot_query_factors"}]
Ticket: "QREG-28"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Th3561>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_USER, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The result of the lexical query classifier that predicts the probability of a click on a topic page 3973"
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 690
CppName: "FI_QUERY_IS_NAV_MX"
Name: "IsNavMxQuery"
DependsOn: [{Feature: ["IsNavMxQuery"], Slice: "begemot_query_factors"}]
Ticket: "SEARCHSPAM-3647"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsNavMxQuery>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_NAV, TG_TRANS, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_DEPRECATED]
Countries: CNT_RU
Description: "Query 'navigation' rank"
Authors: ["anelyubin", "kvn"]
Responsibles: ["anelyubin", "kvn"]
DependsOn: [{Feature: ["QueryNonCommerciality", "TovarCategoryQuery", "TovarCategoryVendor", "IsNavQuery", "QClassDownload", "QClassBrandnames", "QClassDisease", "QClassKak", "QClassMoscow", "QClassOAO", "QClassPorno", "QClassTravel", "CountryPopularQ"]}]
}
Factor {
Index: 691
CppName: "FI_QUERY_URL_YABAR_VISITS_REG"
Name: "QueryUrlYabarVisits_Reg"
Ticket: "BUKI-1180"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "Regional usage of the search engine with a specific query"
Authors: "akhropov"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 692
CppName: "FI_CLICKED_WITH_ANOTHER_SE_CLICKS"
Name: "ClickedWithAnotherSEClicks"
Ticket: "BUKI-1261"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ShowsAndClicksWithAnotherSEClicks>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "Clicks on the URLs shown in the search results for queries that people went on to search for in other search engines"
Authors: "vvp"
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 693
CppName: "FI_SHOWS_WITH_ANOTHER_SE_CLICKS"
Name: "ShowsWithAnotherSEClicks"
Ticket: "BUKI-1261"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ShowsAndClicksWithAnotherSEClicks>"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "Impressions of URLs in the SERP for queries that people went on to search for in other search engines"
Authors: "vvp"
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 694
CppName: "FI_COMMERCIAL_OWNER_RANK_REG"
Name: "CommercialOwnerRank_Reg"
Ticket: ["BUKI-1503", "SEARCHSPAM-3082", "SEARCHSPAM-3486"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/CommercialOwnerRank_Reg>"
Group: "RegHostStatic"
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COMMERCIAL, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_DEPRECATED]
Countries: [CNT_RU, CNT_TR]
Description: "The level of commerciality of the website (classifier)"
Authors: ["anelyubin", "sisoid"]
Responsibles: "efedina"
}
Factor {
Index: 695
CppName: "FI_HOST_IS_MARKET_OFFER"
Name: "HostIsMarketOffer"
Ticket: "COMMERCIAL-41"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "The latest version of the market database contains offers from this host."
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
ImplementationTime: "2020-09-23"
}
Factor {
Index: 696
CppName: "FI_BCLM_MAX"
Name: "BclmMax"
Ticket: "BUKI-1575"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BclmMax>"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The proximity of the query words to the most difficult word."
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 697
CppName: "FI_URL_PRON_REGEXP_MATCH"
Name: "UrlPronRegexpMatch"
Ticket: "SEARCH-10629"
Tags: [TG_URL_TEXT, TG_UNUSED, TG_BINARY]
Description: "The URL matches the regular expression specified in the pron"
Authors: "timuratshin"
Responsibles: "timuratshin"
}
Factor {
Index: 698
CppName: "FI_HAS_USER_REVIEWS"
Name: "HasUserReviews"
Ticket: "ROBOT-2571"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HasUserReviews>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Document contains user feedback/comment"
Authors: ["bogomolov", "kartynnik", "osenzen"]
Responsibles: ["kartynnik", "osenzen"]
}
Factor {
Index: 699
CppName: "FI_REGEX_MAX_CLICK_PERCENT_REG"
Name: "RegexMaxClickPercentReg"
Ticket: "BUKI-1300"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent>"
Group: "Regex"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The ratio of clicks on this URL to all clicks on similar queries, country version, see ((<http://wiki.yandex-team.ru/Development/Poisk/arcadia/indexregex> indexregex))"
Authors: ["finder", "kcd"]
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 700
CppName: "FI_REGEX_CTR_REG"
Name: "RegexCtrReg"
Ticket: "BUKI-1300"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexctr>"
Group: "Regex"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "Corrected CTR of this URL for all related queries, country version, see ((<http://wiki.yandex-team.ru/Development/Poisk/arcadia/indexregex> indexregex))"
Authors: ["finder", "kcd"]
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 701
CppName: "FI_FOUND"
Name: "Found"
DependsOn: [{Feature: ["Found"], Slice: "begemot_query_factors"}]
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Found>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Countries: CNT_ALL
Description: "Average number of search results for the query"
Authors: "denplusplus"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 702
CppName: "FI_YABAR_WORD_DNGI"
Name: "YabarWordDepthNodesGradientMin"
DependsOn: [{Feature: ["YabarWordDepthNodesGradientMin"], Slice: "begemot_query_factors"}]
Ticket: "BUKI-1482"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostStatistics>"
Group: "Query"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_DEPRECATED]
Description: "Angle in Depth Nodes space, computed based on words only (min over all)"
Authors: ["atolstikov", "smikler"]
Responsibles: ["atolstikov", "smikler"]
}
Factor {
Index: 703
CppName: "FI_DBM15_WARES"
Name: "DBM15Wares"
Ticket: "BUKI-1300"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RegexCtr>"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 704
CppName: "FI_RANK_COM_GOODNESS_BAR"
Name: "RankComGoodnessBar"
Ticket: ["SEARCHSPAM-3759", "SEARCHSPAM-3970"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RankComGoodnessBar>"
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_COMMERCIAL, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RU
Description: "A classifier that approximates the quality of commercial sites based on user behavior data"
Authors: ["reat", "sisoid"]
Responsibles: "efedina"
}
Factor {
Index: 705
CppName: "FI_DOC_CREATE_MONTH"
Name: "DocCreateMonth"
Ticket: "BUKI-1583"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DocMonthFactors>"
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED, TG_L2]
Description: "Document creation time, accurate to the month: 1.0 - current month, 0 - 10 years ago or older. Temporarily disabled"
Authors: "bochkarev"
Responsibles: "bochkarev"
}
Factor {
Index: 706
CppName: "FI_DOC_UPDATE_MONTH"
Name: "DocUpdateMonth"
Ticket: "BUKI-1583"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DocMonthFactors>"
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED, TG_L2]
Description: "Document update time, accurate to the month: 1.0 - current month, 0 - 10 years ago or older. Temporarily disabled"
Authors: "bochkarev"
Responsibles: "bochkarev"
}
Factor {
Index: 707
CppName: "FI_LR_SOURCERANK"
Name: "XLRSourceRank"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/XLR-SourceRank-MainPage>"
Group: "Xref"
Tags: [TG_DYNAMIC, TG_LINK_GRAPH, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 708
CppName: "FI_LR_MAINPAGE"
Name: "XLRMainPage"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/XLR-SourceRank-MainPage>"
Group: "Xref"
Tags: [TG_DYNAMIC, TG_LINK_GRAPH, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_LINK_TEXT, TG_DEPRECATED]
Authors: "denplusplus"
Responsibles: "alsafr"
}
Factor {
Index: 709
CppName: "FI_DATER_STATS_YEAR_NORM_LIKELIHOOD"
Name: "DaterStatsYearNormLikelihood"
Ticket: "BUKI-1619"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DaterStatsYearNormLikelihood>"
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The function of the correctness of years distribution in a document. Temporarily disabled"
Authors: "bochkarev"
Responsibles: "bochkarev"
}
Factor {
Index: 710
CppName: "FI_HOST_NUM_SOVETNIK"
Name: "HostNumSovetnik"
Ticket: "CONTENTQUALITY-45"
Authors: ["sdormidontov"]
Responsibles: ["ulyanov", "sdormidontov"]
Description: "Num of Sovetnik urls"
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED],
}
Factor {
Index: 711
CppName: "FI_LCM_VAR"
Name: "LcmVar"
Ticket: "BUKI-1622"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LocmVar>"
Group: "Xref"
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: "Variance of the number of query words in links."
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 712
CppName: "FI_DATER_STATS_AVERAGE_SOURCE_SEGMENT"
Name: "DaterStatsAverageSourceSegment"
Ticket: "BUKI-1619"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DaterStatsAverageSourceSegment>"
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The arithmetic mean of the positions of the dates in the document. Temporarily disabled"
Authors: "bochkarev"
Responsibles: "bochkarev"
}
Factor {
Index: 713
CppName: "FI_DBM15_WARES2"
Name: "DBM15Wares2"
Ticket: "BUKI-1300"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RegexCtr>"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 714
CppName: "FI_CABM"
Name: "Cabm"
Ticket: "BUKI-1629"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Cabm>"
Group: "Xref"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Description: "BM with fading on the text of catalog links."
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 715
CppName: "FI_BEAST_NQUERY_URL_MEAN_POS"
Name: "BeastNqUrlMeanPos"
Ticket: "BUKI-1581"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastNqSiteMeanPos>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_BEAST, TG_DOPP, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_365D, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_TR
Description: "Average url position for the query"
Authors: ["solar", "vvp"]
Responsibles: ["solar", "alsafr", "tarum", "niknik"]
}
Factor {
Index: 716
CppName: "FI_BEAST_NQUERY_OWNER_MEAN_POS"
Name: "BeastNqOwnerMeanPos"
Ticket: "BUKI-1581"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastNqSiteMeanPos>"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_BEAST, TG_DOPP, TG_USER_SEARCH_EXTERNAL, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_365D, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_TR
Description: "Average position of domAttr for the query"
Authors: ["solar", "vvp"]
Responsibles: ["solar", "alsafr", "tarum", "niknik"]
}
Factor {
Index: 717
CppName: "FI_BEAST_URL_MEAN_POS"
Name: "BeastUrlMeanPos"
Ticket: "BUKI-1581"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastSiteMeanPos>"
Group: "RegDocStatic"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_365D, TG_NN_OVER_FEATURES_USE]
Countries: CNT_TR
Description: "The average position of the URL for all queries."
Authors: ["solar", "vvp"]
Responsibles: ["solar", "alsafr", "tarum", "niknik"]
}
Factor {
Index: 718
CppName: "FI_BEAST_HOST_MEAN_POS"
Name: "BeastHostMeanPos"
Ticket: "BUKI-1581"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastSiteMeanPos>"
Group: "RegHostStatic"
Tags: [TG_STATIC, TG_HOST, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Countries: CNT_TR
Description: "The average position of the host for all queries."
Authors: ["solar", "vvp"]
Responsibles: ["solar", "alsafr"]
}
Factor {
Index: 719
CppName: "FI_BEAST_URL_NUM_QUERIES"
Name: "BeastUrlNumQueries"
Ticket: "BUKI-1581"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastSiteNumQueries>"
Group: "RegDocStatic"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Countries: CNT_TR
Description: "The number of queries for the URL."
Authors: ["solar", "vvp"]
Responsibles: ["solar", "alsafr"]
}
Factor {
Index: 720
CppName: "FI_BEAST_HOST_NUM_QUERIES"
Name: "BeastHostNumQueries"
Ticket: "BUKI-1581"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastSiteNumQueries>"
Group: "RegHostStatic"
Tags: [TG_STATIC, TG_HOST, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_UNDOCUMENTED, TG_L2, TG_USERFEAT, TG_USERFEAT_365D, TG_NN_OVER_FEATURES_USE]
Countries: CNT_TR
Description: "The number of queries for the host."
Authors: ["solar", "vvp"]
Responsibles: ["solar", "alsafr", "tarum", "niknik"]
}
Factor {
Index: 721
CppName: "FI_YABAR_HOST_BROWSE_RANK_REG"
Name: "YabarHostBrowseRank_Reg"
Ticket: ["BUKI-1652", "FACTOR-56"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YaBarLogs>"
Group: "RegHostStatic"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_LOCALIZED_COUNTRY, TG_UNIMPLEMENTED, TG_L2]
Countries: CNT_RELEV
Description: "The implementation of the algorithm described in the article ((<http://wiki.yandex-team.ru//h.yandex.net/?http%3A%2F%2Fresearch.microsoft.com%2Fen-us%2Fpeople%2Ftyliu%2Ffp032-liu.pdf> <http://research.microsoft.com/en-us/people/tyliu/fp032-liu.pdf>)) for large regions (TRUBK)."
Authors: "akhropov"
Responsibles: "akhropov"
}
Factor {
Index: 722
CppName: "FI_REMOVED_722"
Name: "Removed_722"
Tags: [TG_REMOVED]
}
Factor {
Index: 723
CppName: "FI_SEGMENT_WORD_PORTION_FROM_MAINCONTENT"
Name: "SegmentWordPortionFromMainContent"
Ticket: "BUKI-1671"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SegmentWordPortionFromMaincontent>"
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The percentage of words in the document from segments with a score > 2."
Authors: "nordic"
Responsibles: "nordic"
}
Factor {
Index: 724
CppName: "FI_URL_DOMAIN_SIMILARITY_FIXED"
Name: "UrlDomainSimilarityFixed"
Ticket: "BUKI-1647"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/urldomainsimilarity>"
Group: "Dynamic"
Tags: [TG_HOST, TG_DYNAMIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 725
CppName: "FI_TOTAL_DUPS"
Name: "TotalDups"
Ticket: "FORMULATOR-185"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage>"
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Authors: "smikler"
Responsibles: "alsafr"
}
Factor {
Index: 726
CppName: "FI_RANK_BOOST_GOODNESS"
Name: "RankBoostGoodness"
Ticket: ["FACTOR-32", "SEARCHSPAM-3858", "SEARCHSPAM-4133"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RankBoostGoodness>"
Tags: [TG_COMMERCIAL, TG_OWNER, TG_STATIC, TG_LOCALIZED_COUNTRY, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RU
Description: "The site quality rank used for boosts in the Moscow commercial formula."
Authors: ["burmisha", "sisoid"]
Responsibles: "efedina"
}
Factor {
Index: 727
CppName: "FI_QUERY_DOWNER_CLICKS_FRC_REG_GEO"
Name: "QueryDOwnerClicksFRCRegGeo"
Ticket: "QREG-31"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoClicks>"
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_CITY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Authors: "esoloviev"
Responsibles: ["esoloviev", "yazevnul", "niknik", "tarum"]
}
Factor {
Index: 728
CppName: "FI_QUERY_URL_CLICKS_FRC_REG_GEO"
Name: "QueryURLClicksFRCRegGeo"
Ticket: "QREG-31"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoClicks>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_CITY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Authors: "esoloviev"
Responsibles: ["esoloviev", "yazevnul", "niknik", "tarum"]
}
Factor {
Index: 729
CppName: "FI_LANGUAGE_DISTRIBUTION"
Name: "LanguageDistribution"
Ticket: "BUKI-1396"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LanguageDistribution>"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Authors: "avatar"
Responsibles: ["avatar", "tarum", "niknik"]
}
Factor {
Index: 730
CppName: "FI_URL_SHOWS_WITH_NEXT_PAGE_CLICKS_P1"
Name: "UrlShowsWithNextPageClicksP1"
Ticket: "BUKI-1549"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/ShowsWithNextPageClicks>"
Group: "RegDocStatic"
Tags: [TG_LOCALIZED_COUNTRY, TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Authors: "morph"
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 731
CppName: "FI_URL_SHOWS_WITH_NEXT_PAGE_CLICKS_P10"
Name: "UrlShowsWithNextPageClicksP10"
Ticket: "BUKI-1549"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/ShowsWithNextPageClicks>"
Description: "The factor used in SelectionRank. TG_UNUSED: should not be included in formulas."
Group: "RegDocStatic"
Tags: [TG_LOCALIZED_COUNTRY, TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNUSED, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2]
Authors: "morph"
Responsibles: "alsafr"
}
Factor {
Index: 732
CppName: "FI_URL_CLICKS_PCTR_YEAR"
Name: "QueryURLClicksPCTRYear"
AntiSeoUpperBound: 0.6
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_UNUSED, TG_OFTEN_ZERO]
Ticket: "BUKI-1658"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/QueryUrlClicksPCTRYear>"
Authors: "apos"
Responsibles: "apos"
}
Factor {
Index: 733
CppName: "FI_URL_CLICKS_PCTR_YEARP"
Name: "QueryURLClicksPCTRPreviousYear"
AntiSeoUpperBound: 0.6
Ticket: "BUKI-1658"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_UNUSED, TG_OFTEN_ZERO]
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/QueryUrlClicksPCTRYear>"
Authors: "apos"
Responsibles: "apos"
}
Factor {
Index: 734
CppName: "FI_SMALL_WINDOW_ATTENUATION"
Name: "SmallWindowAttenuation"
Ticket: "FACTOR-28"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/SmallWindow>"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Responsibles: "alsafr"
}
Factor {
Index: 735
CppName: "FI_RC_SEARCH_BASE_URL_RATIONAL_SIGMOID_D3T120_AT_REQ"
Name: "RcSearchBaseUrlRationalSigmoidD3T120AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: "URL feature computed at the request time from rapid clicks search counters with decay of 3 days"
Ticket: "USERFEAT-1503"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-10-04"
}
Factor {
Index: 736
CppName: "FI_OWNER_CTR_WITH_NEXT_PAGE_CLICKS_P10"
Name: "OwnerCTRWithNextPageClicksP10"
Ticket: "FACTOR-30"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/ShowsWithNextPageClicks>"
Group: "RegHostStatic"
Tags: [TG_LOCALIZED_COUNTRY, TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Authors: "vvp"
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 737
CppName: "FI_COMM_RUS"
Name: "CommRus"
Ticket: ["FACTOR-31", "SEARCHSPAM-3722"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/CommRus>"
Tags: [TG_COMMERCIAL, TG_DOC, TG_STATIC, TG_LOCALIZED_COUNTRY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RU
Description: "Weight of the document based on a single-word commercial lexicon."
Authors: "sisoid"
Responsibles: ["bikulov", "ashagarov"]
}
Factor {
Index: 738
CppName: "FI_WIKI_LINK_COUNT"
Name: "WikiLinkCount"
Ticket: "FACTOR-54"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/WikiLinkCount>"
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_USER, TG_WIKIPEDIA, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1D, TG_NN_OVER_FEATURES_USE]
Authors: ["sokirko", "bogomolov"]
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 739
CppName: "FI_URL_IN_LINKS_TRIGRAMS_STATIC"
Name: "UrlInLinksTrigramsStatic"
Ticket: "FACTOR-43"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlLinksTrigramsStatic>"
Tags: [TG_DOC, TG_LINK_TEXT, TG_STATIC, TG_URL_TEXT, TG_L2, TG_UNUSED]
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 740
CppName: "FI_LINKS_IN_URL_TRIGRAMS_STATIC"
Name: "LinksInUrlTrigramsStatic"
Ticket: "FACTOR-43"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlLinksTrigramsStatic>"
Tags: [TG_DOC, TG_LINK_TEXT, TG_STATIC, TG_URL_TEXT, TG_L2, TG_UNUSED]
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 741
CppName: "FI_UKR_IS_QUERY_LANG"
Name: "UkrIsQueryLang"
Ticket: "FACTOR-51"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/UkrIsQueryLang>"
Tags: [TG_QUERY_ONLY, TG_BINARY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: "Indicates that the query is in the Ukrainian language."
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 742
CppName: "FI_QUERIES_AVG_CM2"
Name: "QueriesAvgCM2"
Ticket: "FACTOR-66"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/QueriesAvgCM2>"
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COMMERCIAL, TG_L2, TG_MASCOT, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Countries: [CNT_RU, CNT_TR]
Description: "Average query commerciality"
Authors: ["burmisha", "sisoid"]
Responsibles: "efedina"
}
Factor {
Index: 743
CppName: "FI_QI_QUERY_COUNT"
Name: "QiQueryCount"
Group: "QI"
Ticket: "FACTOR-63"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USER_SEARCH_EXTERNAL, TG_DEPRECATED]
Description: "The number of queries in a group of frequent queries similar to the given one."
Authors: ["agorodilov", "morph"]
Responsibles: ["smikler", "tsimkha"]
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/oldqifactors>"
}
Factor {
Index: 744
CppName: "FI_QI_URL_FREQ_WEIGHTED_FRC"
Name: "QiUrlFreqWeightedFRC"
Group: "QI"
Ticket: "FACTOR-63"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Description: "FRC (frequency-based relevance criteria) of a group of similar frequent queries to the given query, calculated by taking the average of clicks and impressions."
Authors: ["agorodilov", "morph"]
Responsibles: ["smikler", "tsimkha"]
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/oldqifactors>"
}
Factor {
Index: 745
CppName: "FI_QI_URL_FREQ_WEIGHTED_FRC_REG"
Name: "QiUrlFreqWeightedFRCReg"
Group: "QI"
Ticket: "FACTOR-63"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "FRC (Frequency of Requests in Clusters) of a group of similar frequent queries to a given query, calculated as the average through the sum of clicks and impressions, based on regional statistics."
Authors: "morph"
Responsibles: ["smikler", "tsimkha"]
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/oldqifactors>"
}
Factor {
Index: 746
CppName: "FI_RC_SEARCH_BASE_URL_RATIONAL_SIGMOID_D1TM600_FROZEN"
Name: "RcSearchBaseUrlRationalSigmoidD1TM600Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: "URL feature computed from rapid clicks search frozen counters with decay of 1 day"
Ticket: "USERFEAT-1503"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-10-04"
}
Factor {
Index: 747
CppName: "FI_WORD_HOST_WIKI_SUM"
Name: "WordHostWikiSum"
Ticket: "BUKI-1515"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regwordhost>"
Group: "RegWordHost"
Tags: [TG_DYNAMIC, TG_HOST, TG_WIKIPEDIA, TG_LINK_GRAPH, TG_DEPRECATED]
Description: "Relative popularity of the word-host pair, where word is a word from the title of an article in Wikipedia, and host is the host that is referred to in the article."
Authors: "smikler"
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 748
CppName: "FI_REG_WORD_HOST_CLICKS_SUM"
Name: "RegWordHostClicksSum"
Ticket: "BUKI-1515"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regwordhost>"
Group: "RegWordHost"
Tags: [TG_DYNAMIC, TG_HOST, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The relative clickability of the countryId-word-host triple based on search data from Yandex."
Authors: "smikler"
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 749
CppName: "FI_REG_WORD_HOST_YABAR_SUM"
Name: "RegWordHostYabarSum"
Ticket: "BUKI-1515"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regwordhost>"
Group: "RegWordHost"
Tags: [TG_DYNAMIC, TG_HOST, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "Relative clickability of the countryId-word-host triplet based on data from popular search engines using Bar and SimilarGroup logs."
Authors: "smikler"
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 750
CppName: "FI_REGEX_MAX_CLICK_PERCENT_YABAR_REG"
Name: "RegexMaxClickPercentYabarReg"
Ticket: "FACTOR-11"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent>"
Group: "Regex"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The click-through rate of a URL for all clicks on similar queries, as calculated from popular search engine logs."
Authors: ["smikler", "kcd"]
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 751
CppName: "FI_YABAR_HOST_SURFTR_DEPTH_NODES_LEAFLN"
Name: "YabarHostSurfTrDpNdLeafLn"
Ticket: "BUKI-1334"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostStatistics>"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SURFING_TREE]
Description: "The length of Nodes petal calculated for hosts."
Authors: ["atolstikov", "smikler"]
Responsibles: ["atolstikov", "tarum", "niknik"]
}
Factor {
Index: 752
CppName: "FI_YABAR_HOST_SURFTR_NODES_TIME_GRDISP"
Name: "YabarHostSurfTrNdTmGrDsp"
Ticket: "BUKI-1334"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostStatistics>"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SURFING_TREE]
Description: "Variance of angle in Nodes Time space, calculated for hosts."
Authors: ["atolstikov", "smikler"]
Responsibles: ["atolstikov", "tarum", "niknik"]
}
Factor {
Index: 753
CppName: "FI_YABAR_HOST_SURFTR_NODES_TIME_LEADFLN90"
Name: "YabarHostSurfTrNdTmLeafLn90"
Ticket: "BUKI-1334"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostStatistics>"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SURFING_TREE]
Description: "The 0.9 quantile of the petal length in the Nodes Time space calculated for hosts."
Authors: ["atolstikov", "smikler"]
Responsibles: ["atolstikov", "tarum", "niknik"]
}
Factor {
Index: 754
CppName: "FI_WORD_HOST_DOWNLOAD_PROBABILITY"
Name: "WordHostDownloadProbability"
Ticket: "FACTOR-44"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regwordhost>"
Group: "RegWordHost"
Tags: [TG_DYNAMIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED]
Description: "The average probability of downloading a file from a host after clicking, based on the words in the query."
Authors: ["osenzen", "smikler"]
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 755
CppName: "FI_NASTY_CONTENT"
Name: "NastyContent"
Ticket: ["FACTOR-113", "SEARCHSPAM-2435"]
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/NastyContent>"
Tags: [TG_STATIC, TG_DOC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "How bad the content is (low-quality content)."
Authors: "melkov"
Responsibles: "alsafr"
}
Factor {
Index: 756
CppName: "FI_URL_SYNNORM_PCTR"
Name: "SynnormURLPCTR"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_SYNNORM, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Ticket: "FACTOR-72"
Wiki: "wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/SynnormFeatures"
Description: "CTR based on click data, queries normalized by synsets."
Authors: ["rizar", "ekrokhalev"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 757
CppName: "FI_URL_SYNNORM_PCTR_REG"
Name: "SynnormURLPCTRReg"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_SYNNORM, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Ticket: "FACTOR-72"
Wiki: "wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/SynnormFeatures"
Description: "Regional click-through rate (CTR) based on clicks data, query normalized by synsets."
Authors: ["rizar", "ekrokhalev"]
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 758
CppName: "FI_URL_QUERY_TRIGRAMS_STATIC"
Name: "UrlQueryTrigramsStatic"
Group: "RegDocStatic"
Tags: [TG_LOCALIZED_COUNTRY, TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_UNDOCUMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_URL_QUERY_TRIGRAMS]
Ticket: "FACTOR-24"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/UrlQueryTrigramsStatic>"
Description: "Static trigram intersection of the URL and the queries by which users visited the URL."
Authors: "vvp"
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 759
CppName: "FI_ADV_ASPAM"
Name: "AdvAspam"
Ticket: "BUKI-1757"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/AdvAspam>"
Tags: [TG_COMMERCIAL, TG_OWNER, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_NN_OVER_FEATURES_USE]
Authors: ["burmisha","sisoid"]
Responsibles: "efedina"
}
Factor {
Index: 760
CppName: "FI_HAS_PORNO_QUERY"
Name: "HasPornoQuery"
DependsOn: [{Feature: ["HasPornoQuery"], Slice: "begemot_query_factors"}]
Ticket: "FACTOR-123"
Wiki: "<https://jira.yandex-team.ru/browse/FACTOR-123>"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "The result of the “adult” rule of Sorcerer (algorithm name)."
Authors: "zagrebin"
Responsibles: "smikler"
}
Factor {
Index: 761
CppName: "FI_QU_BM15_WEIGHTED"
Name: "QUBm15Weighted"
Group: "Annotation"
Ticket: "FACTOR-21"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QUFactors>"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_FILTER, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_MULTI_PERIOD]
Description: "Weighted BM15 for a query based on the document index - a list of queries for which the document was clicked."
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 762
CppName: "FI_WS_IS_INDEX_PAGE_AND_BOCM"
Name: "WeightedSumIsIndexPageBocm"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_TRANS, TG_NN_OVER_FEATURES_USE]
Ticket: "FACTOR-140"
Authors: ["burmisha", "sisoid"]
Responsibles: "sisoid"
DependsOn: [{Feature: ["IsIndexPage", "Bocm"]}]
}
Factor {
Index: 763
CppName: "FI_WS_IS_INDEX_PAGE_AND_QUERY_IS_NAV_MX"
Name: "WeightedSumIsIndexPageIsNavMxQuery"
Tags: [TG_DEPRECATED, TG_DYNAMIC, TG_DOC, TG_NAV, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_TRANS, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RU
Ticket: "FACTOR-140"
Authors: ["burmisha", "sisoid"]
Responsibles: "sisoid"
DependsOn: [{Feature: ["IsIndexPage", "IsNavMxQuery"]}]
}
Factor {
Index: 764
CppName: "FI_BROWSER_HOST_DOWNLOAD_PROBABILITY"
Name: "BrowserHostDownloadProbability"
Ticket: "FACTOR-44"
Wiki: "<https://jira.yandex-team.ru/browse/FACTOR-44>"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_DEPRECATED]
Description: "The probability of downloading from a host after the click based on Yandex Bar logs."
Authors: ["osenzen", "smikler"]
Responsibles: "smikler"
}
Factor {
Index: 765
CppName: "FI_NHOP_CHAINS_COUNT_FRC"
Name: "NHopChainsCountFrc"
Group: "RegDocStatic"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_NHOP]
Countries: CNT_RELEV
Ticket: "FACTOR-97"
Wiki: "wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopStatic"
Description: "This is a calculation of the ratio of chains that involve the URL to the total number of chains for a query. The formula is: Number of chains for a query / (Number of chains involving the URL + Number of chains for the query)."
Authors: "vvp"
Responsibles: ["alsafr", "kartynnik", "tarum", "niknik"]
}
Factor {
Index: 766
CppName: "FI_NHOP_IS_FINAL"
Name: "NHopIsFinal"
Group: "RegDocStatic"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_NHOP]
Countries: CNT_RELEV
Ticket: "FACTOR-97"
Wiki: "wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopStatic"
Description: "This is a metric that measures the ratio of sequences where a specific URL was the last one, normalized by the total number of sequences that contained that URL."
Authors: "vvp"
Responsibles: ["alsafr", "kartynnik", "tarum", "niknik"]
}
Factor {
Index: 767
CppName: "FI_VISITS_FROM_WIKI"
Name: "VisitsFromWiki"
Group: "RegDocStatic"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_WIKIPEDIA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_FROM]
Countries: CNT_RELEV
Ticket: "FACTOR-46"
Wiki: "wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/VisitsFromWiki"
Description: "Traffic from Wikipedia to the URL. Measuring the total number of visitors."
Authors: ["bogomolov", "smikler"]
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 768
CppName: "FI_RC_SEARCH_BASE_URL_CONTRAST_D30ODD0_9_X_D30T1_FROZEN"
Name: "RcSearchBaseUrlContrastD30Odd0_9_X_D30T1Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DATA_FROM_BIGRT, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: "URL feature computed from rapid clicks search frozen counters with decay of 30 days"
Ticket: "USERFEAT-1503"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-10-04"
}
Factor {
Index: 769
CppName: "FI_REG_BROWSER_USER_HUB"
Name: "RegBrowserUserHub"
Ticket: "FACTOR-120"
Wiki: "<https://jira.yandex-team.ru/browse/FACTOR-120>"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USER_HUB]
Countries: CNT_RELEV
Group: "RegDocStatic"
Description: "A metric for the page's hub status (the number of pages that Yandex Bar users navigate to from this page)."
Authors: ["vvp", "smikler"]
Responsibles: ["smikler", "tarum", "niknik"]
}
Factor {
Index: 770
CppName: "FI_AUX_TITLE_BM25"
Name: "AuxTitleBM25"
Ticket: "FACTOR-160"
Group: "AuxBM25"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: "TextBM25 for the title of the user's region based on the text of the title, similar to factor 268."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 771
CppName: "FI_BCLMF"
Name: "Bclmf"
Group: "Annotation"
Ticket: "FACTOR-149"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QUFactors>"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_DOC_TEXT, TG_LINK_TEXT, TG_ANNOTATION_FILTER, TG_DEPRECATED]
Description: "BCLM for Annotation index, doc text and links."
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 772
CppName: "FI_NO_PRODUCTS_PROBABILITY"
Name: "NoProductsProbability"
Ticket: "COMMERCIAL-64"
Authors: ["hygge", "alejes", "kpolitay"]
Responsibles: ["hygge", "alejes"]
Description: "Dssm prediction of the probability that there are no products on the page based on URL + title."
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_NN_OVER_FEATURES_USE]
ImplementationTime: "2020-10-04"
}
Factor {
Index: 773
CppName: "FI_PSE_FRC_BROWSER"
Name: "PopularSEFRCBrowser"
Ticket: "FACTOR-193"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/PopularSEFRC>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DOPP, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_POPULAR_SE_FRC, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "FRC (Frequency of Requests from the Browser logs) of a popular search engine."
Authors: ["vvp", "zagrebin", "bogomolov"]
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 774
CppName: "FI_LOG_CTR_MEAN"
Name: "LogCtrMean"
Ticket: "FACTOR-182"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/LogCtrMean>"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "Weighted mean of log(query_clicks)/log(query_shows) for the given host. Weights are proportional to log(query_shows) + 0.2."
Authors: "tsimkha"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 775
CppName: "FI_QUERY_URL_NHOP_TOTAL_FRC"
Name: "QueryUrlNhopTotalFrc"
Ticket: "FACTOR-145"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopQueryUrl>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_NHOP, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "This metric measures the number of clicks on the URL in the chain of hops, normalized by the total number of clicks for the query."
Authors: "vvp"
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 776
CppName: "FI_QUERY_URL_NHOP_IS_FINAL"
Name: "QueryUrlNhopIsFinal"
Ticket: "FACTOR-145"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopQueryUrl>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_NHOP, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The probability of a URL being the last one in a sequence of hops for a given query."
Authors: "vvp"
Responsibles: ["alsafr", "tarum", "niknik"]
}
Factor {
Index: 777
CppName: "FI_ONE_PRODUCT_PROBABILITY"
Name: "OneProductProbability"
Ticket: "COMMERCIAL-64"
Authors: ["hygge", "alejes", "kpolitay"]
Responsibles: ["hygge", "alejes"]
Description: "Dssm prediction of the probability based on url + title that there is one product on the page."
Tags: [TG_L2, TG_NEURAL, TG_STATIC, TG_URL_TEXT, TG_NN_OVER_FEATURES_USE]
ImplementationTime: "2020-10-04"
}
Factor {
Index: 778
CppName: "FI_MANY_PRODUCTS_PROBABILITY"
Name: "ManyProductsProbability"
Ticket: "COMMERCIAL-64"
Authors: ["hygge", "alejes", "kpolitay"]
Responsibles: ["hygge", "alejes"]
Description: "Dssm prediction of the probability based on the URL + title that there are many products on the page."
Tags: [TG_L2, TG_NEURAL, TG_STATIC, TG_URL_TEXT, TG_NN_OVER_FEATURES_USE]
ImplementationTime: "2020-10-04"
}
Factor {
Index: 779
CppName: "FI_RC_SEARCH_BASE_URL_RATIONAL_SIGMOID_D3T120_FROZEN"
Name: "RcSearchBaseUrlRationalSigmoidD3T120Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: "URL feature computed from rapid clicks search frozen counters with decay of 3 days"
Ticket: "USERFEAT-1503"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
ImplementationTime: "2020-10-04"
}
Factor {
Index: 780
CppName: "FI_GEO_CITY_URL_HAS_CITY"
Name: "GeoCityUrlHasCity"
Ticket: "BUKI-1125"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl>"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_URL_TEXT, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: "The URL has a city-level geolocation defined by the BUKI-1125 rules."
Authors: "denplusplus"
Responsibles: "esoloviev"
}
Factor {
Index: 781
CppName: "FI_GEO_CITY_URL_HAS_COUNTRY"
Name: "GeoCityUrlHasCountry"
Ticket: "BUKI-1125"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl>"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_URL_TEXT, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: "The country level geolocation for the URL was defined based on the rules of BUKI-1125."
Authors: "denplusplus"
Responsibles: "esoloviev"
}
Factor {
Index: 782
CppName: "FI_GEO_RELEV_REGION_CITY_GEOA"
Name: "GeoRelevRegionCityGeoa"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor GeoRelevRegionCity based on the attribute “geoa”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 783
CppName: "FI_GEO_RELEV_REGION_REGION_GEOA"
Name: "GeoRelevRegionRegionGeoa"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor GeoRelevRegionRegion based on the attribute “geoa”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 784
CppName: "FI_GEO_GEOMETRY_PROXIM_GEOA"
Name: "GeoGeometryProximGeoa"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor GeoGeometryProxim based on the attribute “geoa”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 785
CppName: "FI_GEO_RELEV_ALIEN_CITY_GEOA"
Name: "GeoRelevAlienCityGeoa"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor GeoRelevAlienCity based on the attribute “geoa”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 786
CppName: "FI_GEO_V_QUERY_IN_USERS_CITY_GEOA"
Name: "GeoVQueryInUserCityGeoa"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor GeoVQueryInUserCity based on the attribute “geoa”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 787
CppName: "FI_GEO_V_QUERY_IN_ALIEN_CITY_GEOA"
Name: "GeoVQueryInAlienCityGeoa"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor GeoVQueryInAlienCity based on the attribute “geoa”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 788
CppName: "FI_PAGE_REGION_SIZE_GEO"
Name: "PageRegionSizeGeo"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The factor PageRegionSize based on the attribute “geo”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 789
CppName: "FI_PAGE_REGION_COVERAGE_GEO"
Name: "PageRegionCoverageGeo"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The factor PageRegionCoverage based on the attribute “geo”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 790
CppName: "FI_PAGE_REGION_COVERAGE_ADRESA"
Name: "PageRegionCoverageAdresa"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor PageRegionCoverage based on the attribute “adresa”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 791
CppName: "FI_GEO_RELEV_REGION_CITY_ADRESA"
Name: "GeoRelevRegionCityAdresa"
Ticket: "QREG-41"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "The factor GeoRelevRegionCity based on the attribute “adresa”."
Authors: "esoloviev"
Responsibles: "esoloviev"
}
Factor {
Index: 792
CppName: "FI_DOPP_URL_SESSION_CLICKS_FRC"
Name: "DoppQueryUrlSessionClicksFRC"
Ticket: "FACTOR-127"
Wiki: "<http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DoppQueryUrlSessionClicksFRC>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DOPP, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "The average ratio of the clicks on the given URL to the total number of clicks on all URLs for a given query, based on user sessions."
Authors: "alsafr"
Responsibles: ["kolesov93", "alsafr"]
}
Factor {
Index: 793
CppName: "FI_OWNER_IS_ACTUAL_SHOP"
Name: "OwnerIsActualShop"
Tags: [TG_OWNER, TG_STATIC, TG_L2, TG_COMMERCIAL]
Description: "The owner is an e-commerce store."
Ticket: "COMMERCIAL-62"
Authors: ["miha715lev", "alejes"]
Responsibles: ["miha715lev", "alejes"]
ImplementationTime: "2020-09-30"
}
Factor {
Index: 794
CppName: "FI_OWNER_IS_SERVICE"
Name: "OwnerIsService"
Tags: [TG_OWNER, TG_STATIC, TG_L2, TG_COMMERCIAL, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The owner is a service business."
Ticket: "COMMERCIAL-62"
Authors: ["miha715lev", "alejes"]
Responsibles: ["miha715lev", "alejes"]
}
Factor {
Index: 795
CppName: "FI_NHOP_TEXT_BCLM_PLANE"
Name: "NHopTextBclmPlane"
Group: "Annotation"
Ticket: "FACTOR-108"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopText>"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_LOCALIZED_COUNTRY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_238D, TG_USERFEAT_NHOP]
Countries: CNT_RELEV
Description: "Bclm based on texts from hops."
Authors: "vvp"
Responsibles: "alsafr"
}
Factor {
Index: 796
CppName: "FI_SAME_QUERY_FRC_BROWSER"
Name: "SameQueryReturnFRCBrowser"
Ticket: "FACTOR-234"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/samequeryreturn>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DOPP, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SAME_QUERY_RETURN, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "FRC, or Frequency of Recurrent Queries, based on clicks for the given query that was used by the user a few times."
Authors: ["bogomolov", "vvp"]
Responsibles: ["smikler", "tarum", "niknik"]
}
Factor {
Index: 797
CppName: "FI_QUERY_URL_ISBM_CTR"
Name: "QueryURLISBMCTR"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/isbm>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SBM, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Ticket: "FACTOR-65"
Description: "The average weight of impressions on the first page is based on the value assigned to clicks (1) and non-clicks (according to the SBM_GAMMAS table)."
Authors: ["shpilman", "dprpavlin"]
Responsibles: ["dprpavlin", "tarum", "niknik"]
}
Factor {
Index: 798
CppName: "FI_QUERY_URL_ISBM_CTR_REG"
Name: "QueryURLISBMCTRReg"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/isbm>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SBM, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Ticket: "FACTOR-65"
Description: "The average weight of impressions on the first page; a click weighs 1, non-click - according to the SBM_GAMMAS table. Regional version."
Authors: ["shpilman", "dprpavlin"]
Responsibles: ["dprpavlin", "tarum", "niknik"]
}
Factor {
Index: 799
CppName: "FI_REGEX_BEAST_POSITION_REG"
Name: "RegexBeastPositionReg"
Ticket: "FACTOR-268"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexbeastpositionreg>"
Group: "Regex"
Tags: [TG_DOC, TG_DYNAMIC, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_LOCALIZED_COUNTRY, TG_L2, TG_DEPRECATED]
Countries: CNT_TR
Description: "The half-sum of the URL position estimate with the median position across all similar queries, based on Beast data."
Authors: ["avatar", "vvp"]
Responsibles: ["avatar", "smikler", "tsimkha"]
}
Factor {
Index: 800
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D3T0_AT_REQ"
Name: "RcSpylogHostRationalSigmoidD3T0AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed at the request time from rapid clicks spy_log counters with decay of 3 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 801
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D3T0DTM3600_AT_REQ"
Name: "RcSpylogHostRationalSigmoidD3DTM3600AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed at the request time from rapid clicks spy_log counters with decay of 3 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 802
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D14T0_AT_REQ"
Name: "RcSpylogHostRationalSigmoidD14T0AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed at the request time from rapid clicks spy_log counters with decay of 14 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 803
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D14DTM3600_AT_REQ"
Name: "RcSpylogHostRationalSigmoidD14DTM3600AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed at the request time from rapid clicks spy_log counters with decay of 14 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 804
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOIDED_CTRD3DT0TM3600_AT_REQ"
Name: "RcSpylogHostRationalSigmoidedCTRD3DT0TM3600AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed at the request time from rapid clicks spy_log counters with decay of 3 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 805
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOIDED_CTRD14DT0TM3600_AT_REQ"
Name: "RcSpylogHostRationalSigmoidedCTRD14DT0TM3600AtReq"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed at the request time from rapid clicks spy_log counters with decay of 14 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 806
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D3T0_FROZEN"
Name: "RcSpylogHostRationalSigmoidD3T0Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed from rapid clicks spy_log counters with decay of 3 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 807
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D3T0DTM3600_FROZEN"
Name: "RcSpylogHostRationalSigmoidD3DTM3600Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed from rapid clicks spy_log counters with decay of 3 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 808
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D14T0_FROZEN"
Name: "RcSpylogHostRationalSigmoidD14T0Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed from rapid clicks spy_log counters with decay of 14 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 809
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D14DTM3600_FROZEN"
Name: "RcSpylogHostRationalSigmoidD14DTM3600Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed from rapid clicks spy_log counters with decay of 14 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 810
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOIDED_CTRD3DT0TM3600_FROZEN"
Name: "RcSpylogHostRationalSigmoidedCTRD3DT0TM3600Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed from rapid clicks spy_log counters with decay of 3 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 811
CppName: "FI_RC_SPYLOG_HOST_RATIONAL_SIGMOIDED_CTRD14DT0TM3600_FROZEN"
Name: "RcSpylogHostRationalSigmoidedCTRD14DT0TM3600Frozen"
Group: "RapidClicks"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: "Host feature computed from rapid clicks spy_log counters with decay of 14 days"
Ticket: "USERFEAT-1508"
Authors: ["skorodumov-s"]
Responsibles: ["skorodumov-s", "tarum"]
}
Factor {
Index: 812
CppName: "FI_COMMERCIAL_DSSM_ODD_LIKE"
Name: "CommercialDssmOddLike"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_DOC_TEXT, TG_URL_TEXT, TG_NEURAL, TG_COMMERCIAL, TG_RTMODELS_SERVICE, TG_NN_OVER_FEATURES_USE]
Description: "Finetuned reformulations DSSM to commercial clicked bargain odd-like target from visit log"
Ticket: "FORMULA-2001"
Authors: ["alexumnov"]
Responsibles: ["alexumnov"]
ImplementationTime: "2020-11-12"
}
Factor {
Index: 813
CppName: "FI_DISTRIBUTOR_HOSTS"
Name: "DistributorHosts"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNIMPLEMENTED, TG_BINARY, TG_UNUSED]
Description: "Is it a legal video distributor"
Ticket: "SEARCHSPAM-15565"
Authors: ["bikulov"]
Responsibles: ["bikulov", "sdormidontov"]
}
Factor {
Index: 814
CppName: "FI_ONE_PRODUCT_PROBABILITY_AVG"
Name: "OneProductProbabilityAvg"
Ticket: "SEARCHSPAM-15568"
Authors: ["ulyanov"]
Responsibles: ["ulyanov", "bikulov"]
Description: "Average value of the feature OneProductProbability"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 815
CppName: "FI_MANY_PRODUCTS_PROBABILITY_AVG"
Name: "ManyProductsProbabilityAvg"
Ticket: "SEARCHSPAM-15568"
Authors: ["ulyanov"]
Responsibles: ["ulyanov", "bikulov"]
Description: "Average value of the feature ManyProductsProbability"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 816
CppName: "FI_PAY_DETECTOR_PREDICT_AVG"
Name: "PayDetectorPredictAvg"
Ticket: "SEARCHSPAM-15568"
Authors: ["ulyanov"]
Responsibles: ["ulyanov", "bikulov"]
Description: "Average value of the feature PayDetectorPredict"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 817
CppName: "FI_OWNER_IS_PARTNER"
Name: "OwnerIsPartner"
Tags: [TG_OWNER, TG_STATIC, TG_L2, TG_COMMERCIAL, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The owner is a partner."
Ticket: "COMMERCIAL-90"
Authors: ["miha715lev", "alejes"]
Responsibles: ["miha715lev", "alejes"]
}
Factor {
Index: 818
CppName: "FI_SHOP_IN_SHOP_URL"
Name: "ShopInShopUrl"
Tags: [TG_DOC, TG_STATIC, TG_L2, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The document is a ShopInShop."
Ticket: "COMMERCIAL-135"
Authors: ["miha715lev", "alejes"]
Responsibles: ["miha715lev", "alejes"]
}
Factor {
Index: 819
CppName: "FI_QUERY_CONVERSION_DETECTOR_PREDICT"
Name: "QueryConversionDetectorPredict"
Ticket: "COMMERCIAL-81"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: "The conversion rate of the query calculated in Hippo (Name of the algorithm)."
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
MaxValue: 25.0
MinValue: -25.0
ImplementationTime: "2020-12-01"
}
Factor {
Index: 820
CppName: "FI_FIO_FROM_ORIGINAL_REQUEST_BODY_CHAIN0_WCM"
Name: "FioFromOriginalRequestBodyChain0Wcm"
Ticket: "SEARCHSPEC-94"
Description: "The factor based on the user's Full name from the original query is calculated based on the content of the document using the Chain0Wcm algorithm."
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 821
CppName: "FI_PRODUCT_OFFER_ANY_AVAILABLE"
Name: "ProductOfferAnyAvailable"
Ticket: "COMMERCIAL-78"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "At least one offer from the parsed data has a status indicating its availability."
Tags: [TG_L2, TG_STATIC, TG_OFTEN_ZERO]
ImplementationTime: "2020-04-07"
}
Factor {
Index: 822
CppName: "FI_PRODUCT_OFFER_NO_PRODUCTS"
Name: "ProductOfferNoProducts"
Ticket: "COMMERCIAL-78"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "There are no offers in the parsed data at all."
Tags: [TG_L2, TG_STATIC]
ImplementationTime: "2020-04-07"
}
Factor {
Index: 823
CppName: "FI_BAD_YTIER_URL"
Name: "BadYtierUrl"
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_UNIMPLEMENTED, TG_OFTEN_ZERO, TG_USER_SEARCH, TG_META, TG_L3, TG_PRS]
Authors: "hommforever"
Responsibles: ["hommforever"]
Ticket: "SEARCHSPEC-25"
Wiki: ""
DependsOn: []
Description: "The URL from “ytier” has low-quality content."
}
Factor {
Index: 824
CppName: "FI_NORM_YTIER_URL"
Name: "NormYtierUrl"
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_UNIMPLEMENTED, TG_OFTEN_ZERO, TG_USER_SEARCH, TG_META, TG_L3, TG_PRS]
Authors: "hommforever"
Responsibles: ["hommforever"]
Ticket: "SEARCHSPEC-25"
Wiki: ""
DependsOn: []
Description: "The URL from “ytier” has the acceptable quality of content."
}
Factor {
Index: 825
CppName: "FI_GOOD_YTIER_URL"
Name: "GoodYtierUrl"
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_UNIMPLEMENTED, TG_OFTEN_ZERO, TG_USER_SEARCH, TG_META, TG_L3, TG_PRS]
Authors: "hommforever"
Responsibles: ["hommforever"]
Ticket: "SEARCHSPEC-25"
Wiki: ""
DependsOn: []
Description: "The URL from “ytier” has a pretty good quality of content"
}
Factor {
Index: 826
CppName: "FI_BEST_YTIER_URL"
Name: "BestYtierUrl"
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_UNIMPLEMENTED, TG_OFTEN_ZERO, TG_USER_SEARCH, TG_META, TG_L3, TG_PRS]
Authors: "hommforever"
Responsibles: ["hommforever"]
Ticket: "SEARCHSPEC-25"
Wiki: ""
DependsOn: []
Description: "The URL from “ytier” has high-quality content"
}
Factor {
Index: 827
CppName: "FI_HOST_IS_ECOM_PURCHASE"
Name: "HostIsEcomPurchase"
Ticket: "COMMERCIAL-124"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "The host offers an option to purchase goods. (Ecommerce)"
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 828
CppName: "FI_HOST_IS_VISIT_LOGS_PURCHASE"
Name: "HostIsVisitLogsPurchase"
Ticket: "COMMERCIAL-124"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "The host offers an option to purchase goods, based on visit logs."
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 829
CppName: "FI_YANDEX_MARKET_PRODUCT_URL"
Name: "YandexMarketProductUrl"
Tags: [TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The URL is a product on the Yandex Market."
Ticket: "COMMERCIAL-128"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
# ImplementationTime: "2020-12-04"
}
Factor {
Index: 830
CppName: "FI_YANDEX_MARKET_PRODUCT_INCLUDE_OFFERID_URL"
Name: "YandexMarketProductIncludeOfferidUrl"
Tags: [TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The URL is a product on the Yandex Market and has an offerid."
Ticket: "COMMERCIAL-128"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
# ImplementationTime: "2020-12-04"
}
Factor {
Index: 831
CppName: "FI_SHOP_IN_SHOP_CPA_URL"
Name: "ShopInShopCPAUrl"
Tags: [TG_DYNAMIC, TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The URL is ShopInShopCPA."
Ticket: "COMMERCIAL-183"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
# ImplementationTime: "2020-03-18"
}
Factor {
Index: 832
CppName: "FI_PRODUCT_OFFER_NOT_AVAILABLE"
Name: "ProductOfferNotAvailable"
Ticket: "COMMERCIAL-78"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "At least one offer from the parsed data has an unavailable status."
Tags: [TG_L2, TG_STATIC, TG_OFTEN_ZERO]
ImplementationTime: "2020-04-07"
}
Factor {
Index: 833
CppName: "FI_OWNER_IS_ECOM_PURCHASE"
Name: "OwnerIsEcomPurchase"
Ticket: "COMMERCIAL-124"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "The owner offers an option to purchase goods. (Ecommerce)"
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED]
ImplementationTime: "2020-12-17"
}
Factor {
Index: 834
CppName: "FI_OWNER_IS_VISIT_LOGS_PURCHASE"
Name: "OwnerIsVisitLogsPurchase"
Ticket: "COMMERCIAL-124"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "The owner offers an option to purchase goods, based on visit logs."
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 835
CppName: "FI_NAV_PARASITES"
Name: "NavParasites"
Ticket: "FACTOR-2471"
Authors: ["hygge", "alejes", "polandr"]
Responsibles: ["hygge", "alejes"]
Description: "Dssm probability prediction by url + title that the document is a parasite."
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_NOT_01, TG_UNUSED, TG_ALLOW_USE_FOR_SPAM_FORMULAS]
ImplementationTime: "2022-01-01"
MinValue: -0.5
MaxValue: 1.5
}
Factor {
Index: 836
CppName: "FI_OFFER_AVAILABILITY_IS_SET_UP"
Name: "OfferAvailabilityIsSetUp"
Ticket: "COMMERCIAL-186"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "The offer from the new parser has the “PartnerOfferContent available” field set."
Tags: [TG_L2, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 837
CppName: "FI_OFFER_AVAILABILITY"
Name: "OfferAvailability"
Ticket: "COMMERCIAL-186"
Authors: ["hygge", "alejes"]
Responsibles: ["hygge", "alejes"]
Description: "The PartnerOfferContent available == true based on the offer from the new parser"
Tags: [TG_L2, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 838
CppName: "FI_URL_CLICKS_MAX_GEO_CITY_FRC_WEIGHT"
Name: "URLClicksMaxGeoCityFRCWeight"
Ticket: "FACTOR-36"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/URLClicksMaxGeoCityFRC>"
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_GEOCLICKS]
Description: "Normalized corrected clicks count by query with user's city(gc=) mentioned"
Authors: "esoloviev"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 839
CppName: "FI_URL_CLICKS_MAX_GEO_CITY_FRC_RATIO"
Name: "URLClicksMaxGeoCityFRCRatio"
Ticket: "FACTOR-36"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/URLClicksMaxGeoCityFRC>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_GEOCLICKS]
Description: "Normalized corrected clicks maximum ratio by query with user's city(gc=) mentioned"
Authors: "esoloviev"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 840
CppName: "FI_URL_CLICKS_MAX_ALIEN_GEO_CITY_FRC_RATIO"
Name: "URLClicksMaxGeoAlienCityFRCRatio"
Ticket: "FACTOR-36"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/URLClicksMaxGeoCityFRC>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_GEOCLICKS]
Description: "Normalized corrected clicks maximum ratio by query with a city other than the user's city(gc=) mentioned"
Authors: "esoloviev"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 841
CppName: "FI_FAST_MX"
Name: "FastMx"
Ticket: "FACTOR-271"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/FastMx>"
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Authors: ["vmordovin", "sisoid"]
Responsibles: ["vmordovin", "sisoid"]
}
Factor {
Index: 842
CppName: "FI_PURCHASE_TOTAL_PREDICT"
Name: "PurchaseTotalPredict"
Ticket: "COMMERCIAL-190"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The value of PurchaseTotalPredict calculated in the Hippo (The name of the algorithm)."
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
MinValue: -10
MaxValue: 10
}
Factor {
Index: 843
CppName: "FI_SERP_SUMMARY_SURPLUS_PREDICT"
Name: "SerpSummarySurplusPredict"
Ticket: "COMMERCIAL-190"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The SerpSummarySurplusPredict value calculated in the Hippo (The name of the algorithm)."
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
}
Factor {
Index: 844
CppName: "FI_YABAR_URL_REVISITS"
Name: "YabarUrlRevisits"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Revisits>"
Ticket: "FACTOR-186"
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_REVISITS]
Description: "Does the user return to this URL?"
Authors: ["shpilman", "atolstikov"]
Responsibles: ["atolstikov", "tarum", "niknik"]
}
Factor {
Index: 845
CppName: "FI_REQUEST_WITH_120_D3_CLICK_PART_PREDICT"
Name: "RequestWith120D3ClickPartPredict"
Ticket: "COMMERCIAL-190"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The value of RequestWith120D3ClickPartPredict calculated in the Hippo (The name of the algorithm)."
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
MinValue: -10
MaxValue: 110
}
Factor {
Index: 846
CppName: "FI_QUERY_NAV_PARASITES_DETECTOR_PREDICT"
Name: "QueryNavParasitesDetectorPredict"
Ticket: "COMMERCIAL-190"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_UNUSED]
Description: "The value of the parasite request detector calculated in the Hippo (The name of the algorithm)."
Authors: ["alejes", "hygge", "i-vainn"]
Responsibles: ["alejes", "hygge"]
ImplementationTime: "2022-01-01"
}
Factor {
Index: 847
CppName: "FI_BROWSER_HOST_CNT_DWELL_TIME_LOG"
Name: "BrowserHostCntDwellTimeLog"
Group: "RegHostStatic"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/YabarUrlVisitsRegions>"
Ticket: "FACTOR-324"
Tags: [TG_STATIC, TG_USER, TG_HOST, TG_BROWSER, TG_LOCALIZED_COUNTRY, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_REG_SITE_BROWSER]
Countries: CNT_RELEV
Description: "Logarithm of the average time spent by a user on a host with localization by country; calculated according to Yabar logs"
Authors: ["gotmanov", "vvp", "esoloviev"]
Responsibles: ["gotmanov", "alsafr"]
}
Factor {
Index: 848
CppName: "FI_BROWSER_HOST_DWELL_TIME_REGION_FRC"
Name: "BrowserHostDwellTimeRegionFrc"
Group: "RegHostStatic"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/YabarUrlVisitsRegions>"
Ticket: "FACTOR-324"
Tags: [TG_STATIC, TG_USER, TG_HOST, TG_BROWSER, TG_LOCALIZED_REGION, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_REG_SITE_BROWSER]
Description: "Ratio of dwell time on a host in a given region to dwell time on a host across all regions"
Authors: ["gotmanov", "vvp", "esoloviev"]
Responsibles: ["gotmanov"]
}
Factor {
Index: 849
CppName: "FI_BROWSER_URL_DWELL_TIME_REGION_FRC"
Name: "BrowserUrlDwellTimeRegionFrc"
Group: "RegDocStatic"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/YabarUrlVisitsRegions>"
Ticket: "FACTOR-324"
Tags: [TG_STATIC, TG_USER, TG_DOC, TG_BROWSER, TG_LOCALIZED_REGION, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_REG_SITE_BROWSER]
Description: "Ratio of dwell time on a page in a given region to dwell time on a page across all regions"
Authors: ["gotmanov", "vvp", "esoloviev"]
Responsibles: ["gotmanov"]
}
Factor {
Index: 850
CppName: "FI_BROWSER_BOOKMARKS_URL"
Name: "BrowserBookmarksUrl"
Ticket: "FACTOR-310"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BrowserBookmarks>"
Tags: [TG_STATIC, TG_USER, TG_BROWSER, TG_DOC, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: "The more users add this URL to bookmarks, the higher the factor value"
Authors: ["pavelgur", "vvp"]
Responsibles: ["pavelgur", "tarum", "niknik"]
}
Factor {
Index: 851
CppName: "FI_SOS_DSSM"
Name: "SosDssm"
Ticket: "FACTOR-2475"
Authors: ["hygge", "alejes", "anrodigina", "hommforever"]
Responsibles: ["hygge", "alejes"]
Description: "Sos.dssm model prediction by url + title."
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_NOT_01, TG_USED_IN_CONF_REARR]
MinValue: -1
MaxValue: 1
ImplementationTime: "2021-03-31"
}
Factor {
Index: 852
CppName: "FI_MED_DSSM"
Name: "MedDssm"
Ticket: "FACTOR-2475"
Authors: ["hygge", "alejes", "anrodigina", "hommforever"]
Responsibles: ["hygge", "alejes"]
Description: "Med.dssm model prediction by url + title."
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_NOT_01, TG_USED_IN_CONF_REARR]
MinValue: -10
MaxValue: 10
ImplementationTime: "2021-03-31"
}
Factor {
Index: 853
CppName: "FI_FIN_LAW_DSSM"
Name: "FinLawDssm"
Ticket: "FACTOR-2475"
Authors: ["hygge", "alejes", "anrodigina", "hommforever"]
Responsibles: ["hygge", "alejes"]
Description: "Fin_law.dssm model prediction by url + title."
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 854
CppName: "FI_WIKI_INFOBOX"
Name: "WikiInfobox"
Ticket: "FACTOR-85"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/WikiInfobox>"
Tags: [TG_STATIC, TG_DOC, TG_WIKIPEDIA, TG_USER, TG_LINK_GRAPH, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1D, TG_NN_OVER_FEATURES_USE]
Description: "There is a link to this URL from Infoboxes on Wikipedia."
Authors: ["dimavin", "smikler"]
Responsibles: ["dimavin", "smikler", "tarum", "niknik"]
}
Factor {
Index: 855
CppName: "FI_CRUELTY_DSSM"
Name: "CrueltyDssm"
Ticket: "FACTOR-2476"
Authors: ["hygge", "alejes", "anrodigina", "hommforever"]
Responsibles: ["hygge", "alejes"]
Description: "Cruelty.dssm model prediction by url + title."
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_UNUSED, TG_USED_IN_CONF_REARR, TG_NOT_01]
MinValue: -10
MaxValue: 10
}
Factor {
Index: 856
CppName: "FI_HALF_ECOM_PREDICT"
Name: "HalfEcomPredict"
Ticket: "COMMERCIAL-190"
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_UNUSED, TG_UNIMPLEMENTED]
Description: "The value of HalfEcomPredict calculated in the Hippo (The name of the algorithm)."
Authors: ["alejes", "hygge"]
Responsibles: ["alejes", "hygge"]
}
Factor {
Index: 857
CppName: "FI_PREFIX_SUFFIX_MAX_CLICK_PERCENT_REG"
Name: "PrefixSuffixMaxClickPercentReg"
Ticket: "FACTOR-396"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent>"
Group: "Regex"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "This factor is similar to RegexMaxClickPercentReg, but calculated from prefix-suffix generalization."
Authors: ["smikler"]
Responsibles: ["smikler", "tsimkha", "yustuken"]
}
Factor {
Index: 858
CppName: "FI_PREFIX_SUFFIX_MAX_CLICK_PERCENT_YABAR_REG"
Name: "PrefixSuffixMaxClickPercentYabarReg"
Ticket: "FACTOR-396"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent>"
Group: "Regex"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: "This factor is similar to RegexMaxClickPercentYabarReg, but calculated from prefix-suffix generalization."
Authors: ["smikler"]
Responsibles: ["smikler", "tsimkha", "yustuken"]
}
Factor {
Index: 859
CppName: "FI_DSSM_NAVIGATION_L2"
Name: "DssmNavigationL2"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_NEURAL, TG_L2]
Description: "Query-document navigation model."
UseArtifact: {Name: "DssmNavigationL2"}
Ticket: "SEARCH-10934"
Authors: ["hygge", "alejes", "arrin"]
Responsibles: ["hygge", "alejes"]
ImplementationTime: "2021-03-31"
}
Factor {
Index: 860
CppName: "FI_YABAR_HOST_SURFTR_NODES_HANGS_GRADIENT"
Name: "YabarHostSurfTrNdHgGr"
Ticket: "FACTOR-112"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/SurfTr-Hangs>"
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_DEPRECATED]
Description: "Average angle of inclination in the apex-hovering plane"
Authors: ["atolstikov", "osenzen"]
Responsibles: "atolstikov"
}
Factor {
Index: 861
CppName: "FI_QUERY_URL_CORRECTED_CTR_XFACTOR"
Name: "QueryUrlCorrectedCtrXfactor"
Ticket: "FACTOR-397"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlCorrectedCtrXfactor>"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_COLLABORATED, TG_USER, TG_L2, TG_DEPRECATED, TG_REMOVED]
Countries: [CNT_ALL, CNT_TR]
Description: "Query-URL factor. Value - the result of collaborative data filtering for the QueryUrlCorrectedCtr factor"
Authors: ["avatar", "vvp", "alsafr"]
Responsibles: ["avatar", "alsafr"]
}
Factor {
Index: 862
CppName: "FI_FULL_MATRIX_NET"
Name: "FullMatrixNet"
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: "SAASSUP-3320"
Authors: ["derrior"]
Responsibles: ["derrior"]
Description: "The MatrixNet value of the slow ranking model."
}
Factor {
Index: 863
CppName: "FI_FAST_MATRIX_NET"
Name: "FastMatrixNet"
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: "SAASSUP-3320"
Authors: ["derrior"]
Responsibles: ["derrior"]
Description: "The MatrixNet value of the fast ranking model."
}
Factor {
Index: 864
CppName: "FI_FILTER_MATRIX_NET"
Name: "FilterMatrixNet"
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: "SAASSUP-3320"
Authors: ["derrior"]
Responsibles: ["derrior"]
Description: "The MatrixNet value of the filtering model."
}
Factor {
Index: 865
CppName: "FI_SMALL_WINDOW_ATTENUATION_Q"
Name: "SmallWindowAttenuationQ"
Ticket: "FACTOR-441"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/SmallWindow>"
Group: "CombinedAbs"
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Authors: "alsafr"
Responsibles: "alsafr"
}
Factor {
Index: 866
CppName: "FI_QUERY_DOC_TITLE_RANGES_MATCHING_SCORE"
Name: "QueryDocTitleRangesMatchingScore"
Ticket: "FACTOR-353"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryDocTitleRanges>"
Tags: [TG_DYNAMIC, TG_DOC, TG_DOC_TEXT, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "This factor is calculated based on the text of the query and the title of the document."
Authors: ["gotmanov", "magaz"]
Responsibles: ["gotmanov", "magaz"]
}
Factor {
Index: 867
CppName: "FI_FULL_POLYNOM"
Name: "FullPolynom"
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: "SAAS-6009"
Authors: ["derrior"]
Responsibles: ["derrior"]
Description: "The Polynom value of the slow ranking model."
}
Factor {
Index: 868
CppName: "FI_FAST_POLYNOM"
Name: "FastPolynom"
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: "SAAS-6009"
Authors: ["derrior"]
Responsibles: ["derrior"]
Description: "The Polynom value of the fast ranking model."
}
Factor {
Index: 869
CppName: "FI_FILTER_POLYNOM"
Name: "FilterPolynom"
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: "SAAS-6009"
Authors: ["derrior"]
Responsibles: ["derrior"]
Description: "The Polynom value of the filtering ranking model."
}
Factor {
Index: 870
CppName: "FI_IS_TRANSLATED_DOCUMENT"
Name: "IsTranslatedDocument"
Tags: [TG_DOC, TG_STATIC, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: "MT-14803"
Authors: ["bvshuryg"]
Responsibles: ["bvshuryg"]
Description: "There is a sign of usage of machine translation for the document."
}
Factor {
Index: 871
CppName: "FI_MED_DSSM_WITH_TRASH"
Name: "MedDssmWithTrash"
Ticket: "SENS-177"
Authors: ["hygge", "alejes", "anrodigina", "hommforever", "nenashevna"]
Responsibles: ["hygge", "alejes"]
Description: "Prediction of the med_with_trash.dssm model (med. document model with trash added for learning) based on url + title."
MinValue: -2.0
MaxValue: 2.0
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_UNUSED, TG_UNIMPLEMENTED, TG_NOT_01]
}
Factor {
Index: 872
CppName: "FI_FIN_LAW_DSSM_WITH_TRASH"
Name: "FinLawDssmWithTrash"
Ticket: "SENS-177"
Authors: ["hygge", "alejes", "anrodigina", "hommforever", "nenashevna"]
Responsibles: ["hygge", "alejes"]
Description: "Prediction of the fin_law_with_trash.dssm model (fin-jur. document model with trash added for learning) based on url + title."
MinValue: -2.0
MaxValue: 2.0
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_UNUSED, TG_NOT_01, TG_USED_IN_CONF_REARR]
}
Factor {
Index: 873
CppName: "FI_FIO_FROM_ORIGINAL_REQUEST_BODY_MIN_WINDOW_SIZE"
Name: "FioFromOriginalRequestBodyMinWindowSize"
Ticket: "SEARCHSPEC-94"
Description: "This factor is based on the full name from the original query. Calculated based on the content of the document. The minimum size of the window that contains all query words. Normalized to the number of words in the query."
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_TEXT_MACHINE]
ImplementationTime: "2021-08-30"
}
Factor {
Index: 874
CppName: "FI_FIO_FROM_ORIGINAL_REQUEST_TEXT_COSINE_MATCH_MAX_PREDICTION"
Name: "FioFromOriginalRequestTextCosineMatchMaxPrediction"
Ticket: "SEARCHSPEC-94"
Description: "This factor is based on full name from the original query. Algorithm: CosineMatchMaxPrediction."
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 875
CppName: "FI_ALL_FIO_FROM_ORIGINAL_REQUEST_ALL_MAX_F_BODY_CHAIN0_WCM"
Name: "AllFioFromOriginalRequestAllMaxFBodyChain0Wcm"
Ticket: "SEARCHSPEC-94"
Description: "This factor is based on all full names from the original query. Aggregation by all extensions. Type of extension aggregation: highest factor value; Calculated based on document content. Algorithm: Chain0Wcm."
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 876
CppName: "FI_ALL_FIO_FROM_ORIGINAL_REQUEST_ALL_MAX_F_BODY_MIN_WINDOW_SIZE"
Name: "AllFioFromOriginalRequestAllMaxFBodyMinWindowSize"
Ticket: "SEARCHSPEC-94"
Description: "This factor is based on all full names from the original query. Aggregation over all extensions. Type of extension aggregation: highest factor value; calculated based on the contents of the document. Minimum window size for all words in the query to be included, normalized by the number of words in the query."
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 877
CppName: "FI_SP_AVG_CLICK_FRC_SYN_REG"
Name: "SamplePeriodClickFrcSyn"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_SYNNORM, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_SAMPLE_PERIOD, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF_SAMPLE_PERIOD, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The percentage of the clicks on the URL in the total number of clicked URLs per session (synnorm) for the given query."
Authors: "monnoroch"
Responsibles: ["monnoroch", "alsafr", "tarum", "niknik"]
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Ticket: "FACTOR-442"
}
Factor {
Index: 878
CppName: "FI_SP_AVG_TOTAL_FRC_SYN_REG"
Name: "SamplePeriodDayFrcSyn"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_SYNNORM, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_SAMPLE_PERIOD, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF_SAMPLE_PERIOD, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The average percentage of the clicks on the given URL for the given query among all clicks for the query (synnorm) during the day."
Authors: "monnoroch"
Responsibles: ["monnoroch", "alsafr", "tarum", "niknik"]
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Ticket: "FACTOR-442"
}
Factor {
Index: 879
CppName: "FI_SP_AVG_TOTAL_FRC_REG"
Name: "SamplePeriodDayFrc"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_SAMPLE_PERIOD, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF_SAMPLE_PERIOD, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: "The average percentage of clicks on the given URL for a given query among all clicks on the query (qnorm) during the day."
Authors: "monnoroch"
Responsibles: ["monnoroch", "alsafr", "tarum", "niknik"]
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Ticket: "FACTOR-442"
}
Factor {
Index: 880
CppName: "FI_QI_QUERY_URL_CORRECTED_CTR_XFACTOR"
Name: "QiQueryUrlCorrectedCtrXfactor"
Group: "QI"
Ticket: "FACTOR-306"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/qiuserdata>"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_USER_EXT_DATA, TG_COLLABORATED, TG_USER, TG_L2, TG_DEPRECATED, TG_REMOVED]
Countries: [CNT_ALL, CNT_TR]
Description: "QI version of factor 861. MaxValue over the set of popular similar queries."
Authors: "tsimkha"
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 881
CppName: "FI_QI_QUERY_URL_ISBM_CTR_REG"
Name: "QiQueryURLISBMCTRReg"
Group: "QI"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/qiuserdata>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Ticket: "FACTOR-306"
Description: "QI version of factor 798. MaxValue over the set of popular similar queries."
Authors: "tsimkha"
Responsibles: ["smikler", "tsimkha"]
}
Factor {
Index: 882
CppName: "FI_ALL_FIO_FROM_ORIGINAL_REQUEST_ALL_MAX_F_TEXT_COSINE_MATCH_MAX_PREDICTION"
Name: "AllFioFromOriginalRequestAllMaxFTextCosineMatchMaxPrediction"
Ticket: "SEARCHSPEC-94"
Description: "The factor is based on all full names (FIO) from the original query, aggregated across all extensions. The aggregation type for extensions is the maximum value of the factor, calculated based on the document text. The algorithm used is CosineMatchMaxPrediction."
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 883
CppName: "FI_DSSM_PAGE_QUALITY"
Name: "DssmPageQuality"
Ticket: "SEARCH-11378, SEARCHSPEC-172"
Authors: ["jullak"]
Responsibles: ["nenashevna", "hommforever", "jullak"]
Description: "Dssm, predicting the page quality rating of the document."
Tags: [TG_DEPRECATED, TG_NEURAL, TG_STATIC, TG_URL_TEXT, TG_DOC]
ImplementationTime: "2021-11-25"
}
Factor {
Index: 884
CppName: "FI_HAS_TURBO_ECOM"
Name: "HasTurboEcom"
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED]
Ticket: "SEARCHSPAM-15910"
Authors: ["bikulov"]
Responsibles: ["bikulov", "ulyanov"]
}
Factor {
Index: 885
CppName: "FI_MEMORANDUM_URL_TYPE"
Name: "MemorandumUrlType"
Tags: [TG_DOC, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: "CONTENTQUALITY-169"
Authors: ["makkolts"]
Responsibles: ["makkolts", "sdormidontov"]
}
Factor {
Index: 886
CppName: "FI_SP_AVG_TOTAL_FRC_XFACTOR_REG"
Name: "SamplePeriodDayFrcXfactor"
Ticket: "FACTOR-506"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiodXfactor>"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_COLLABORATED, TG_USER, TG_L2, TG_DEPRECATED, TG_REMOVED]
Countries: [CNT_RU]
Description: "Query+URL factor. Value - result of collaborative filtering of data for SamplePeriodDayFrc factor."
Authors: ["avatar", "monnoroch", "alsafr"]
Responsibles: ["avatar", "monnoroch"]
}
Factor {
Index: 887
CppName: "FI_FAST_FILTER_MATRIX_NET"
Name: "FastFilterMatrixNet"
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: "SAAS-5758"
Authors: ["odinmillion"]
Responsibles: ["odinmillion"]
Description: "The value of MatrixNet in a fast ranking filtering model."
}
Factor {
Index: 888
CppName: "FI_FAST_FILTER_POLYNOM"
Name: "FastFilterPolynom"
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: "SAAS-5758"
Authors: ["odinmillion"]
Responsibles: ["odinmillion"]
Description: "The value of Polynom in a fast ranking filtering model."
}
Factor {
Index: 889
CppName: "FI_QI_SP_AVG_TOTAL_FRC_REG"
Name: "QiSamplePeriodDayFrc"
Group: "QI"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Ticket: "FACTOR-442"
Description: "QI version of factor 879."
Authors: "monnoroch"
Responsibles: ["monnoroch", "tsimkha"]
}
Factor {
Index: 890
CppName: "FI_META_MATRIX_NET"
Name: "MetaMatrixNet"
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: "SAASSUP-3741"
Authors: ["odinmillion"]
Responsibles: ["odinmillion"]
Description: "The value of MatrixNet on the meta level."
}
Factor {
Index: 891
CppName: "FI_META_POLYNOM"
Name: "MetaPolynom"
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: "SAASSUP-3741"
Authors: ["odinmillion"]
Responsibles: ["odinmillion"]
Description: "The value of Polynom on the meta level."
}
Factor {
Index: 892
CppName: "FI_SHORT_VIDEO"
Name: "ShortVideo"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: "SEARCHPLAY-24"
Authors: ["bbetrozova"]
Responsibles: ["bbetrozova", "alejes"]
Description: "The document is a short video (TikTok, Reels, Shorts)."
}
Factor {
Index: 893
CppName: "FI_TELEGRAM_CHANNEL_WEB"
Name: "TelegramChannelWebFormat"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: "SEARCHPLAY-49"
Authors: ["bbetrozova"]
Responsibles: ["bbetrozova", "alejes"]
Description: "The document is a Telegram channel in a web format."
}
Factor {
Index: 894
CppName: "FI_TELEGRAM_POST"
Name: "TelegramPost"
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: "SEARCHPLAY-49"
Authors: ["bbetrozova"]
Responsibles: ["bbetrozova", "alejes"]
Description: "The document is a post or message on a Telegram channel."
}
Factor {
Index: 895
CppName: "FI_CORRECTED_CTR_ANNOTATION_MATCH_PREDICTION"
Name: "CorrectedCtrAnnotationMatchPrediction"
Ticket: "FACTOR-468"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: "CorrectedCtrReg factor in the annotation index, AnnotationMatchPrediction factor."
Authors: ["alsafr", "smikler"]
Responsibles: "smikler"
}
Factor {
Index: 896
CppName: "FI_CORRECTED_CTR_QUERY_MATCH_PREDICTION"
Name: "CorrectedCtrQueryMatchPrediction"
Ticket: "FACTOR-468"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: "CorrectedCtrReg factor in the annotation index, QueryMatchPrediction factor."
Authors: ["alsafr", "smikler"]
Responsibles: "smikler"
}
Factor {
Index: 897
CppName: "FI_CORRECTED_CTR_VALUE_WCM_AVG"
Name: "CorrectedCtrValueWcmAvg"
Ticket: "FACTOR-468"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: "The CorrectedCtrReg factor in the annotation index and the ValueWcmAvg factor."
Authors: ["alsafr", "smikler"]
Responsibles: "smikler"
}
Factor {
Index: 898
CppName: "FI_CORRECTED_CTR_BM15_V4_K5"
Name: "CorrectedCtrBm15V4K5"
Ticket: "FACTOR-468"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: "The CorrectedCtrReg factor in the annotation index, factor Bm15V4K5."
Authors: ["alsafr", "smikler"]
Responsibles: "smikler"
}
Factor {
Index: 899
CppName: "FI_IS_NOT_CGI"
Name: "IsNotCgi"
Ticket: "FACTOR-575"
Tags: [TG_STATIC, TG_URL_TEXT, TG_DOC, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: "Whether the URL contains the '?' symbol. The factor is equal to zero if the URL has CGI parameters (more precisely: all duplicates have a '?' symbol in the URL)."
Authors: "ilnurkh"
Responsibles: "ilnurkh"
}
Factor {
Index: 900
CppName: "FI_ALICE_CLICK_DSSM"
Name: "AliceClickDssm"
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_DOC_CONTENT, TG_NEURAL, TG_UNDOCUMENTED, TG_UNUSED, TG_ALICE_MUSIC, TG_RTMODELS_SERVICE, TG_ALLOW_USE_FOR_ALICE]
Description: "DSSM-based click prediction using data specific to Alice (voice search)."
Ticket: "SEARCHSPEC-132"
Authors: "an-to-nen-ko"
Responsibles: "an-to-nen-ko"
ImplementationTime: "2021-11-27"
}
Factor {
Index: 901
CppName: "FI_TEL_FULL_ATTRIBUTE_TEXT_BOCM15_K001"
Name: "TelFullAttributeTextBocm15K001"
Ticket: "SEARCHPLAY-70"
Description: "The factor is based on the tel_full phone attribute from the original query, computed over the document text. It uses the Bocm15 word weight aggregation algorithm with a normalization coefficient of 0.01."
Tags: [TG_DOC, TG_DOC_TEXT, TG_TEXT_MACHINE, TG_UNDOCUMENTED, TG_DYNAMIC]
Authors: "ilnurkh"
Responsibles: "ilnurkh"
ImplementationTime: "2022-02-09"
}
Factor {
Index: 902
CppName: "FI_REMOVED_902"
Name: "Removed_902"
Tags: [TG_REMOVED]
}
Factor {
Index: 903
CppName: "FI_SAMPLE_PERIOD_DAY_FRC_QUERY_MATCH_PREDICTION"
Name: "SamplePeriodDayFrcQueryMatchPrediction"
Ticket: "FACTOR-605"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SamplePeriodDayFrc is a factor in the annotation index, the QueryMatchPrediction factor."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 904
CppName: "FI_SAMPLE_PERIOD_DAY_FRC_ANNOTATION_MATCH_PREDICTION"
Name: "SamplePeriodDayFrcAnnotationMatchPrediction"
Ticket: "FACTOR-605"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SamplePeriodDayFrc is a factor in the annotation index, AnnotationMatchPrediction factor."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 905
CppName: "FI_ONE_CLICK_QUERY_MATCH_PREDICTION"
Name: "OneClickQueryMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, QueryMatchPrediction factor."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 906
CppName: "FI_ONE_CLICK_ANNOTATION_MATCH_PREDICTION"
Name: "OneClickAnnotationMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, AnnotationMatchPrediction factor."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 907
CppName: "FI_ONE_CLICK_BM15_AK4"
Name: "OneClickBm15AK4"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor Bm15AK4."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 908
CppName: "FI_ONE_CLICK_BOCM_WEIGHTED_W1K3"
Name: "OneClickBocmWeightedW1K3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, BocmWeightedW1K3 factor."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 909
CppName: "FI_LONG_CLICK_QUERY_MATCH_PREDICTION"
Name: "LongClickQueryMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClick factor in the annotation index, QueryMatchPrediction factor."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 910
CppName: "FI_LONG_CLICK_ANNOTATION_MATCH_PREDICTION"
Name: "LongClickAnnotationMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClick is a factor in the annotation index, the AnnotationMatchPrediction factor."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 911
CppName: "FI_LONG_CLICK_BM15_AK4"
Name: "LongClickBm15AK4"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClick factor in the annotation index, factor Bm15AK4"
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 912
CppName: "FI_LONG_CLICK_BOCM_WEIGHTED_W1K3"
Name: "LongClickBocmWeightedW1K3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClick factor in the annotation index, BocmWeightedW1K3 factor."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 913
CppName: "FI_SPLIT_DWELL_TIME_QUERY_MATCH_PREDICTION"
Name: "SplitDwellTimeQueryMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SplitDwellTime factor in the annotation index, QueryMatchPrediction factor."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 914
CppName: "FI_SPLIT_DWELL_TIME_ANNOTATION_MATCH_PREDICTION"
Name: "SplitDwellTimeAnnotationMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SplitDwellTime is a factor in the annotation index, the AnnotationMatchPrediction factor."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 915
CppName: "FI_BQPR_QUERY_MATCH_PREDICTION"
Name: "BQPRQueryMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "The BQPR factor in the annotation index, the QueryMatchPrediction factor."
Authors: "smikler"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 916
CppName: "FI_BQPR_ANNOTATION_MATCH_PREDICTION"
Name: "BQPRAnnotationMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "BQPR is a factor in the annotation index and the factor AnnotationMatchPrediction."
Authors: "smikler"
}
Factor {
Index: 917
CppName: "FI_YABAR_VISITS_QUERY_MATCH_PREDICTION"
Name: "YabarVisitsQueryMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "YabarVisits factor in the annotation index, QueryMatchPrediction factor."
Authors: ["akhropov", "ilnurkh"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 918
CppName: "FI_YABAR_VISITS_ANNOTATION_MATCH_PREDICTION"
Name: "YabarVisitsAnnotationMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "YabarVisits factor in annotation index, AnnotationMatchPrediction factor"
Authors: ["akhropov", "ilnurkh"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 919
CppName: "FI_YABAR_TIME_QUERY_MATCH_PREDICTION"
Name: "YabarTimeQueryMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "YabarTime factor in annotation index, factor QueryMatchPrediction"
Authors: ["akhropov", "ilnurkh"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 920
CppName: "FI_YABAR_TIME_ANNOTATION_MATCH_PREDICTION"
Name: "YabarTimeAnnotationMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "YabarTime factor in the annotation index, factor AnnotationMatchPrediction."
Authors: ["akhropov", "ilnurkh"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 921
CppName: "FI_SIMPLE_CLICK_QUERY_MATCH_PREDICTION"
Name: "SimpleClickQueryMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SimpleClick factor in the annotation index, QueryMatchPrediction factor."
Authors: "monnoroch"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 922
CppName: "FI_SIMPLE_CLICK_ANNOTATION_MATCH_PREDICTION"
Name: "SimpleClickAnnotationMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SimpleClick factor in the annotation index, AnnotationMatchPrediction factor."
Authors: "monnoroch"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 923
CppName: "FI_LONG_CLICK_BOCM_PLAIN"
Name: "LongClickBocmPlain"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClick factor in the annotation index, factor BocmPlain."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 924
CppName: "FI_RANDOM_LOG_DBM35_XFACTOR_FULL_MATCH_PREDICTION"
Name: "RandomLogDBM35XfactorFullMatchPrediction"
Ticket: "FACTOR-579"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: "The result of collaborative filtering based on the FI_DBM35 factor from random log in the annotation index, factor FullMatchPrediction."
Authors: ["avatar", "alsafr", "akhropov"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 925
CppName: "FI_RANDOM_LOG_DBM35_XFACTOR_ANNOTATION_MATCH_PREDICTION"
Name: "RandomLogDBM35XfactorAnnotationMatchPrediction"
Ticket: "FACTOR-579"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: "The result of collaborative filtering based on the FI_DBM35 factor from random log in the annotation index, factor AnnotationMatchPrediction."
Authors: ["avatar", "alsafr", "akhropov"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 926
CppName: "FI_ONE_CLICK_SYNONYM_MATCH_PREDICTION"
Name: "OneClickSynonymMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "The result of collaborative filtering based on the OneClick factor from random log in the annotation index, SynonymMatchPrediction factor."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 927
CppName: "FI_ONE_CLICK_FULL_MATCH_PREDICTION"
Name: "OneClickFullMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor FullMatchPrediction."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 928
CppName: "FI_ONE_CLICK_VALUE_WCM_AVG"
Name: "OneClickValueWcmAvg"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor ValueWcmAvg"
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 929
CppName: "FI_ONE_CLICK_BOCM_WEIGHTED_MAX_K1"
Name: "OneClickBocmWeightedMaxK1"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor BocmWeightedMaxK1."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 930
CppName: "FI_ONE_CLICK_BM15_STRICT_K2"
Name: "OneClickBm15StrictK2"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor Bm15StrictK2."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 931
CppName: "FI_ONE_CLICK_BM15_MAX_K3"
Name: "OneClickBm15MaxK3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor Bm15MaxK3"
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 932
CppName: "FI_ONE_CLICK_BCLM_PLAIN_W1K3"
Name: "OneClickBclmPlainW1K3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor BclmPlainW1K3."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 933
CppName: "FI_ONE_CLICK_VALUE_WCM_MAX"
Name: "OneClickValueWcmMax"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor ValueWcmMax."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 934
CppName: "FI_ONE_CLICK_VALUE_WCM_PREDICTION"
Name: "OneClickValueWcmPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor ValueWcmPrediction."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 935
CppName: "FI_ONE_CLICK_BCLM_WEIGHTED_K3"
Name: "OneClickBclmWeightedK3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in the annotation index, factor BclmWeightedK3."
Authors: ["alsafr", "pavelgur"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 936
CppName: "FI_BQPR_BOCM_WEIGHTED_W1_K3"
Name: "BQPRBocmWeightedW1K3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "BQPR factor in the annotation index, factor BocmWeightedW1K3."
Authors: "smikler"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 937
CppName: "FI_BQPR_BM15_STRICT_K2"
Name: "BQPRBm15StrictK2"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "BQPR factor in the annotation index, factor Bm15StrictK2."
Authors: "smikler"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 938
CppName: "FI_SPLIT_DWELL_BOCM_WEIGHTED_MAX_K1"
Name: "SplitDwellTimeBocmWeightedMaxK1"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SplitDwellTime factor in the annotation index, BocmWeightedMaxK1 factor."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 939
CppName: "FI_SPLIT_DWELL_TIME_FULL_MATCH_PREDICTION"
Name: "SplitDwellTimeFullMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SplitDwellTime factor in the annotation index, factor FullMatchPrediction."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 940
CppName: "FI_SPLIT_DWELL_TIME_VALUE_WCM_AVG"
Name: "SplitDwellTimeValueWcmAvg"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SplitDwellTime factor in the annotation index, ValueWcmAvg factor."
Authors: "pavelgur"
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 941
CppName: "FI_CORRECTED_CTR_BM15_STRICT_K2"
Name: "CorrectedCtrBm15StrictK2"
Ticket: "FACTOR-468"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: "CorrectedCtrReg factor in annotation index, Bm15StrictK2 factor"
Authors: ["alsafr", "smikler"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 942
CppName: "FI_FRACTION_OF_QUERIES_WITH_GEO_PREDICTION"
Name: "FractionOfQueriesWithGeoPredicted"
DependsOn: [{Feature: ["FractionOfQueriesWithGeoPredicted"], Slice: "begemot_query_factors"}]
Ticket: "FACTOR-508"
Group: "Query"
Tags: [TG_QUERY_ONLY, TG_USER_SEARCH, TG_LOCALIZED_COUNTRY, TG_DYNAMIC, TG_L2, TG_DEPRECATED]
Countries: [CNT_ALL]
Description: "Prediction of the percentage of queries with geolocation, based on the set of words built for the query."
Authors: ["yazevnul"]
Responsibles: ["yazevnul", "esoloviev"]
}
Factor {
Index: 943
CppName: "FI_URL_IS_EXACT"
Name: "IsExactUrl"
DependsOn: [{Feature: ["IsExactUrl"], Slice: "begemot_query_factors"}]
Tags: [TG_BINARY, TG_DYNAMIC, TG_QUERY_ONLY, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: "The query is a URL, up to differences in dots and spaces (the “isurl” rule is used)."
Ticket: "FACTOR-682"
Authors: ["mbusel", "smikler"]
Responsibles: "mbusel"
}
Factor {
Index: 944
CppName: "FI_RANDOM_LOG_DBM35_XFACTOR_VALUE_WCM_MAX"
Name: "RandomLogDBM35XfactorValueWcmMax"
Ticket: "FACTOR-579"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: "The result of collaborative filtering for the FI_DBM35 factor from random log in the annotation index, factor ValueWcmMax."
Authors: ["avatar", "alsafr", "akhropov"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 945
CppName: "FI_RANDOM_LOG_DBM35_XFACTOR_VALUE_WCM_AVG"
Name: "RandomLogDBM35XfactorValueWcmAvg"
Ticket: "FACTOR-579"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: "Result of collaborative filtering for factor FI_DBM35 from random log in annotation index, factor ValueWcmAvg"
Authors: ["avatar", "alsafr", "akhropov"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 946
CppName: "FI_RANDOM_LOG_DBM35_XFACTOR_BM15_STRICK_K2"
Name: "RandomLogDBM35XfactorBm15StrictK2"
Ticket: "FACTOR-579"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: "Result of collaborative filtering for factor FI_DBM35 based on random log in annotation index, factor Bm15StrictK2"
Authors: ["avatar", "alsafr", "akhropov"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 947
CppName: "FI_RANDOM_LOG_DBM35_XFACTOR_BCLM_PLAIN_W1_k3"
Name: "RandomLogDBM35XfactorBclmPlainW1K3"
Ticket: "FACTOR-579"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: "Result of collaborative filtering for factor FI_DBM35 based on random log in annotation index, factor BclmPlainW1K3"
Authors: ["avatar", "alsafr", "akhropov"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 948
CppName: "FI_RANDOM_LOG_DBM35_XFACTOR_BCLM_WEIGHTED_K3"
Name: "RandomLogDBM35XfactorBclmWeightedK3"
Ticket: "FACTOR-579"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: "Result of collaborative filtering for factor FI_DBM35 based on random log in annotation index, factor BclmWeightedK3"
Authors: ["avatar", "alsafr", "akhropov"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 949
CppName: "FI_RANDOM_LOG_DBM35_XFACTOR_BOCM_WEIGHTED_K3"
Name: "RandomLogDBM35XfactorBocmWeightedW1K3"
Ticket: "FACTOR-579"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: "Result of collaborative filtering for factor FI_DBM35 based on random log in annotation index, factor BocmWeightedW1K3"
Authors: ["avatar", "alsafr", "akhropov"]
Responsibles: ["smikler", "yustuken", "diver"]
}
Factor {
Index: 950
CppName: "FI_CORRECTED_CTR_XFACTOR_ANNOTATION_MATCH_PREDICTION"
Name: "CorrectedCtrXfactorAnnotationMatchPrediction"
Ticket: "FACTOR-716"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlCorrectedCtrXfactor>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COLLABORATED, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_REMOVED]
Description: "CorrectedCtrXfactor in the annotation index, AnnotationMatchPrediction factor"
Authors: ["vvp", "alsafr", "avatar"]
Responsibles: ["yustuken", "diver", "avatar"]
}
Factor {
Index: 951
CppName: "FI_CORRECTED_CTR_XFACTOR_QUERY_MATCH_PREDICTION"
Name: "CorrectedCtrXfactorQueryMatchPrediction"
Ticket: "FACTOR-716"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlCorrectedCtrXfactor>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COLLABORATED, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_REMOVED]
Description: "CorrectedCtrXfactor in the annotation index, QueryMatchPrediction factor"
Authors: ["vvp", "alsafr", "avatar"]
Responsibles: ["yustuken", "diver", "avatar"]
}
Factor {
Index: 952
CppName: "FI_CORRECTED_CTR_XFACTOR_VALUE_WCM_MAX"
Name: "CorrectedCtrXfactorValueWcmMax"
Ticket: "FACTOR-716"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlCorrectedCtrXfactor>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COLLABORATED, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_REMOVED]
Description: "CorrectedCtrXfactor in annotation index, ValueWcmMax factor"
Authors: ["vvp", "alsafr", "avatar"]
Responsibles: ["yustuken", "diver", "avatar"]
}
Factor {
Index: 953
CppName: "FI_CORRECTED_CTR_XFACTOR_VALUE_WCM_AVG"
Name: "CorrectedCtrXfactorValueWcmAvg"
Ticket: "FACTOR-716"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlCorrectedCtrXfactor>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COLLABORATED, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_REMOVED]
Description: "CorrectedCtrXfactor in annotation index, ValueWcmAvg factor"
Authors: ["vvp", "alsafr", "avatar"]
Responsibles: ["yustuken", "diver", "avatar"]
}
Factor {
Index: 954
CppName: "FI_CORRECTED_CTR_XFACTOR_BOCM_WEIGHTED_W1K3"
Name: "CorrectedCtrXfactorBocmWeightedW1K3"
Ticket: "FACTOR-716"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlCorrectedCtrXfactor>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COLLABORATED, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_REMOVED]
Description: "CorrectedCtrXfactor in annotation index, BocmWeightedW1K3 factor"
Authors: ["vvp", "alsafr", "avatar"]
Responsibles: ["yustuken", "diver", "avatar"]
}
Factor {
Index: 955
CppName: "FI_CORRECTED_CTR_XFACTOR_BCLM_PLAIN_K3"
Name: "CorrectedCtrXfactorBclmPlainK3"
Ticket: "FACTOR-716"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlCorrectedCtrXfactor>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COLLABORATED, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_REMOVED]
Description: "CorrectedCtrXfactor in annotation index, BclmPlainK3 factor"
Authors: ["vvp", "alsafr", "avatar"]
Responsibles: ["yustuken", "diver", "avatar"]
}
Factor {
Index: 956
CppName: "FI_CORRECTED_CTR_XFACTOR_BCLM_MIX_PLAIN_W1K1"
Name: "CorrectedCtrXfactorBclmMixPlainW1K1"
Ticket: "FACTOR-716"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlCorrectedCtrXfactor>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COLLABORATED, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_REMOVED]
Description: "CorrectedCtrXfactor in annotation index, BclmMixPlainW1K1 factor"
Authors: ["vvp", "alsafr", "avatar"]
Responsibles: ["yustuken", "diver", "avatar"]
}
Factor {
Index: 957
CppName: "FI_ALICE_TIMESPENT_SUFFIX_SUM"
Name: "AliceTimespentSuffixSum"
Tags: [TG_UNIMPLEMENTED, TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_DOC_CONTENT, TG_NEURAL, TG_UNDOCUMENTED, TG_UNUSED, TG_ALICE_MUSIC, TG_RTMODELS_SERVICE, TG_ALLOW_USE_FOR_ALICE]
Description: "Prediction of the total duration of the session until its end, given that this query-document pair is realized"
Ticket: "SEARCHSPEC-132"
Authors: "an-to-nen-ko"
Responsibles: "an-to-nen-ko"
}
Factor {
Index: 958
CppName: "FI_ALICE_TIMESPENT"
Name: "AliceTimespent"
Tags: [TG_UNIMPLEMENTED, TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_DOC_CONTENT, TG_NEURAL, TG_UNDOCUMENTED, TG_UNUSED, TG_ALICE_MUSIC, TG_RTMODELS_SERVICE, TG_ALLOW_USE_FOR_ALICE]
Description: "Predicting the contribution of this query-document pair to the duration of the session"
Ticket: "SEARCHSPEC-132"
Authors: "an-to-nen-ko"
Responsibles: "an-to-nen-ko"
}
Factor {
Index: 959
CppName: "FI_SAMPLE_PERIOD_DAY_FRC_VALUE_WCM_AVG"
Name: "SamplePeriodDayFrcValueWcmAvg"
Ticket: "FACTOR-605"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SamplePeriodDayFrc factor in annotation index, factor ValueWcmAvg"
Authors: "monnoroch"
Responsibles: ["yustuken", "diver"]
}
Factor {
Index: 960
CppName: "FI_SAMPLE_PERIOD_DAY_FRC_BM15_MAX_K3"
Name: "SamplePeriodDayFrcBm15MaxK3"
Ticket: "FACTOR-605"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SamplePeriodDayFrc factor in annotation index, Bm15MaxK3 factor"
Authors: "monnoroch"
Responsibles: ["yustuken", "diver"]
}
Factor {
Index: 961
CppName: "FI_SAMPLE_PERIOD_DAY_FRC_BOCM_WEIGHTED_K3"
Name: "SamplePeriodDayFrcBocmWeightedK3"
Ticket: "FACTOR-605"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SamplePeriodDayFrc factor in annotation index, factor BocmWeightedK3"
Authors: "monnoroch"
Responsibles: ["yustuken", "diver"]
}
Factor {
Index: 962
CppName: "FI_SAMPLE_PERIOD_DAY_FRC_BOCM_DOUBLE_K5"
Name: "SamplePeriodDayFrcBocmDoubleK5"
Ticket: "FACTOR-605"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod>"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SamplePeriodDayFrc factor in annotation index, BocmDoubleK5 factor"
Authors: "monnoroch"
Responsibles: ["yustuken", "diver"]
}
Factor {
Index: 963
CppName: "FI_SPLIT_DWELL_TIME_BM15_MAX_K3"
Name: "SplitDwellTimeBm15MaxK3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SplitDwellTime factor in annotation index, Bm15MaxK3 factor"
Authors: "pavelgur"
Responsibles: ["yustuken", "diver"]
}
Factor {
Index: 964
CppName: "FI_SIMPLE_CLICK_BCLM_WEIGHTED_K3"
Name: "SimpleClickBclmWeightedK3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "SimpleClick factor in annotation index, BclmWeightedK3 factor"
Authors: "monnoroch"
Responsibles: ["yustuken", "diver"]
}
Factor {
Index: 965
CppName: "FI_ALICE_MAX_PERCENT_PLAYED"
Name: "AliceMaxPercentPlayed"
Tags: [TG_UNIMPLEMENTED, TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_DOC_CONTENT, TG_NEURAL, TG_UNDOCUMENTED, TG_UNUSED, TG_ALICE_MUSIC, TG_RTMODELS_SERVICE, TG_ALLOW_USE_FOR_ALICE]
Description: "Prediction of the percentage of track duration that will be played, given that this query-track pair is realized"
Ticket: "SEARCHSPEC-132"
Authors: "an-to-nen-ko"
Responsibles: "an-to-nen-ko"
}
Factor {
Index: 966
CppName: "FI_WEIGHTED_UNMATCH_URL_PREDICTED_USER_REGION"
Name: "WeightedUnMatchUrlPredictedAndUserRegion"
Ticket: "BUKI-2076"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/MatchUrlPredictedAndUserRegion>"
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_URL_TEXT, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: "The probability that the region predicted by the yweb/robot/urlgeo_ml model is correct, if the city is predicted"
Authors: ["esoloviev", "mbusel"]
Responsibles: ["mbusel"]
}
Factor {
Index: 967
CppName: "FI_PSE_FRC_BROWSER_ANNOTATION_MATCH_PREDICTION"
Name: "PopularSEFRCBrowserAnnotationMatchPrediction"
Ticket: "FACTOR-675"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER]
Countries: CNT_RELEV
Description: "PopularSEFRCBrowser factor in annotation index, AnnotationMatchPrediction factor"
Authors: ["mbusel", "tsimkha"]
Responsibles: ["mbusel", "yustuken", "diver"]
}
Factor {
Index: 968
CppName: "FI_PSE_FRC_BROWSER_SYNONYM_MATCH_PREDICTION"
Name: "PopularSEFRCBrowserSynonymMatchPrediction"
Ticket: "FACTOR-675"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER]
Description: "PopularSEFRCBrowser factor in annotation index, SynonymMatchPrediction factor"
Countries: CNT_RELEV
Authors: ["mbusel", "tsimkha"]
Responsibles: ["mbusel", "yustuken", "diver"]
}
Factor {
Index: 969
CppName: "FI_PSE_FRC_BROWSER_VALUE_WCM_PREDICTION"
Name: "PopularSEFRCBrowserValueWcmPrediction"
Ticket: "FACTOR-675"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER]
Description: "PopularSEFRCBrowser factor in annotation index, factor ValueWcmPrediction"
Countries: CNT_RELEV
Authors: ["mbusel", "tsimkha"]
Responsibles: ["mbusel", "yustuken", "diver"]
}
Factor {
Index: 970
CppName: "FI_PSE_FRC_BROWSER_BCLM_WEIGHTED_V2K3"
Name: "PopularSEFRCBrowserBclmWeightedV2K3"
Ticket: "FACTOR-675"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER]
Description: "PopularSEFRCBrowser factor in annotation index, BclmWeightedV2K3 factor"
Countries: CNT_RELEV
Authors: ["mbusel", "tsimkha"]
Responsibles: ["mbusel", "yustuken", "diver"]
}
Factor {
Index: 971
CppName: "FI_PSE_FRC_BROWSER_BCLM_MIX_PLAIN_W1K1"
Name: "PopularSEFRCBrowserBclmMixPlainW1K1"
Ticket: "FACTOR-675"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER]
Description: "PopularSEFRCBrowser factor in annotation index, factor BclmMixPlainW1K1"
Countries: CNT_RELEV
Authors: ["mbusel", "tsimkha"]
Responsibles: ["mbusel", "yustuken", "diver"]
}
Factor {
Index: 972
CppName: "XLR_ANNOTATION_MATCH_PREDICTION"
Name: "XLRAnnotationMatchPrediction"
Group: "Xref"
Ticket: "BUKI-2408"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/xlrannotationmatchprediction>"
Tags: [TG_DYNAMIC, TG_DOC, TG_LINK_TEXT, TG_DEPRECATED]
Description: "It is calculated based on the link index. Max(sum(idf)) based on all links that are subsets of query / sum(idf) for query"
Authors: "edik"
Responsibles: "edik"
}
Factor {
Index: 973
CppName: "FI_ONE_CLICK_ANNOTATION_MATCH_PREDICTION_WEIGHTED"
Name: "OneClickAnnotationMatchPredictionWeighted"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "OneClick factor in annotation index, AnnotationMatchPredictionWeighted factor"
Authors: ["alsafr", "pavelgur", "edik"]
Responsibles: ["edik", "yustuken", "diver"]
}
Factor {
Index: 974
CppName: "FI_LONG_CLICK_ANNOTATION_MATCH_PREDICTION_WEIGHTED"
Name: "LongClickAnnotationMatchPredictionWeighted"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClick factor in annotation index, AnnotationMatchPredictionWeighted factor"
Authors: ["pavelgur", "edik"]
Responsibles: ["edik", "yustuken", "diver"]
}
Factor {
Index: 975
CppName: "FI_YABAR_TIME_ANNOTATION_MATCH_PREDICTION_WEIGHTED"
Name: "YabarTimeAnnotationMatchPredictionWeighted"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "YabarTime factor in annotation index, AnnotationMatchPredictionWeighted factor"
Authors: ["akhropov", "ilnurkh", "edik"]
Responsibles: ["edik", "yustuken", "diver"]
}
Factor {
Index: 976
CppName: "FI_PAGE_HAS_MAPS_API"
Name: "PageHasMapsApi"
Tags: [TG_STATIC, TG_DOC, TG_BINARY, TG_NN_OVER_FEATURES_USE]
Description: "Equals 1 if the page includes the JS API of any geo-data provider"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/PageHasMapsApi>"
Authors: ["ilnurkh"]
Responsibles: ["ilnurkh"]
}
Factor {
Index: 977
CppName: "FI_LONG_CLICK_SP_ANNOTATION_MATCH_PREDICTION"
Name: "LongClickSPAnnotationMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, AnnotationMatchPrediction factor"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 978
CppName: "FI_LONG_CLICK_SP_QUERY_MATCH_PREDICTION"
Name: "LongClickSPQueryMatchPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, QueryMatchPrediction factor"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 979
CppName: "FI_LONG_CLICK_SP_VALUE_WCM_AVG"
Name: "LongClickSPValueWcmAvg"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, factor ValueWcmAvg"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 980
CppName: "FI_LONG_CLICK_SP_VALUE_WCM_PREDICTION"
Name: "LongClickSPValueWcmPrediction"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, factor ValueWcmPrediction"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 981
CppName: "FI_LONG_CLICK_SP_BCLM_PLAIN_W1K3"
Name: "LongClickSPBclmPlainW1K3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, BclmPlainW1K3 factor"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 982
CppName: "FI_LONG_CLICK_SP_BCLM_WEIGHTED_K3"
Name: "LongClickSPBclmWeightedK3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, BclmWeightedK3 factor"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 983
CppName: "FI_LONG_CLICK_SP_BOCM_WEIGHTED_W1K3"
Name: "LongClickSPBocmWeightedW1K3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, factor BocmWeightedW1K3"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 984
CppName: "FI_LONG_CLICK_SP_BCLM_PLAIN_K5"
Name: "LongClickSPBclmPlainK5"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, BclmPlainK5 factor"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 985
CppName: "FI_LONG_CLICK_SP_BCLM_WEIGHTED_V2K3"
Name: "LongClickSPBclmWeightedV2K3"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, BclmWeightedV2K3 factor"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 986
CppName: "FI_LONG_CLICK_SP_BOCM_DOUBLE_K5"
Name: "LongClickSPBocmDoubleK5"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, factor BocmDoubleK5"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 987
CppName: "FI_LONG_CLICK_SP_BM15_STRICT_K2"
Name: "LongClickSPBm15StrictK2"
Group: "Annotation"
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: "LongClickSamplePeriod factor in annotation index, Bm15StrictK2 factor"
Ticket: "FACTOR-685"
Authors: ["tsimkha", "pavelgur"]
Responsibles: ["tsimkha", "yustuken", "diver"]
}
Factor {
Index: 988
CppName: "FI_URL_CLICKS_MAX_GEO_REGION_FRC_RATIO"
Name: "URLClicksMaxGeoRegionFRCRatio"
Ticket: "FACTOR-36"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/URLClicksMaxGeoCityFRC>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_GEOCLICKS]
Description: "Normalized corrected clicks maximum ratio by query with user's city(gc=) mentioned equal by region"
Authors: "esoloviev"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 989
CppName: "FI_URL_CLICKS_MAX_GEO_REGIONONLY_FRC_RATIO"
Name: "URLClicksMaxGeoRegionOnlyFRCRatio"
Ticket: "FACTOR-36"
Wiki: "<http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/URLClicksMaxGeoCityFRC>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_GEOCLICKS]
Description: "Normalized corrected clicks maximum ratio by query with user's city(gc=) mentioned equal to user's region"
Authors: "esoloviev"
Responsibles: ["tarum", "niknik"]
}
Factor {
Index: 990
CppName: "FI_BQPR_SAMPLE_WCM_COVERAGE_MAX"
Name: "BQPRSampleWcmCoverageMax"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. Factor WcmCoverageMax"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 991
CppName: "FI_BQPR_SAMPLE_FULL_MATCH_PREDICTION"
Name: "BQPRSampleFullMatchPrediction"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. FullMatchPrediction factor"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 992
CppName: "FI_BQPR_SAMPLE_ANNOTATION_MATCH_PREDICTION_WEIGHTED"
Name: "BQPRSampleAnnotationMatchPredictionWeighted"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. Factor AnnotationMatchPredictionWeighted"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 993
CppName: "FI_BQPR_SAMPLE_VALUE_PCM_AVG"
Name: "BQPRSampleValuePcmAvg"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. Factor ValuePcmAvg"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 994
CppName: "FI_BQPR_SAMPLE_VALUE_WCM_AVG"
Name: "BQPRSampleValueWcmAvg"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. Factor ValueWcmAvg"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 995
CppName: "FI_BQPR_SAMPLE_BM15_V4_K5"
Name: "BQPRSampleBm15V4K8"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. Factor Bm15V4K8"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 996
CppName: "FI_BQPR_SAMPLE_BOCM_WEIGHTED_V4_K8"
Name: "BQPRSampleBocmWeightedV4K8"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. Factor BocmWeightedV4K8"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 997
CppName: "FI_BQPR_SAMPLE_WCM_MAX"
Name: "BQPRSampleWcmMax"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. WcmMax factor"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 998
CppName: "FI_BQPR_SAMPLE_SYNONYM_MATCH_PREDICTION"
Name: "BQPRSampleSynonymMatchPrediction"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. SynonymMatchPrediction Factor"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 999
CppName: "FI_BQPR_SAMPLE_ANNOTATION_MATCH_PREDICTION"
Name: "BQPRSampleAnnotationMatchPrediction"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. AnnotationMatchPrediction factor"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}
Factor {
Index: 1000
CppName: "FI_BQPR_SAMPLE_SUFFIX_MATCH_COUNT"
Name: "BQPRSampleSuffixMatchCount"
Group: "Annotation"
Ticket: "FACTOR-799"
Wiki: "<https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BQPRSample>"
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_BROWSER, TG_USER_EXT_DATA]
Description: "BQPR based on the sampled period. Annotation index. SuffixMatchCount factor"
Authors: ["asandler"]
Responsibles: ["asandler", "avatar"]
}