If you’re an SEO, knowing how content ranks is important for success in the SERPs.
Below is Yandex’s entire source code:
# Contains human-readable representation of NFactor::TCodeGenInput message (defined in factors_metadata.proto)
Group: [
“datetime”,
“domain”,
“Rapid Clicks”,
“RegHostStatic”,
“RegDocStatic”,
“Regex”,
“LinkBM25”,
“TextBM25”,
“TextAndLinkBM25”,
“BM25F”,
“best form”,
“UrlBM25”,
“PositionLanguageModel”,
“DBM25”,
“AuxBM25”,
“Annotations”,
“Tocm”,
“Bocm”,
“combinedabs”,
“SWBM25”,
“QI”,
“Combined Sequences”,
“ExactGroups”,
“QSegments”,
“QueryWordSequencesSTR”,
“QueryWordSequencesLR”,
“SynSet Locm”,
“Xref”,
“LegacyLR”,
“LegacyTR”,
“Dynamic”,
“BCLM”,
“Link Forms”,
“text forms”,
“RegWordHost”,
“Query”,
“QueryTitleSnippetCTR”
]
slice {
Name: “web_production”
Factor {
Index: 0
CppName: “FI_PAGE_RANK”
Name: “PR”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/PageRank”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_L2, TG_UNUSED]
Description: “Page rank. The factor is being remapped.”
Authors: “aavdonkin”
Responsibles: “aavdonkin”
}
Factor {
Index: 1
CppName: “FI_TEXT_RELEV”
Name: “TR”
AntiSeoUpperBound: 0.95
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Text relevance (maxfreq is the frequency of the most frequent word, which makes sense of the length of the document).”
Authors: [“gulin”, “iseg”, “leo”, “maslov”]
Responsibles: [“gulin”, “leo”, “maslov”]
}
Factor {
Index: 2
CppName: “FI_LINK_RELEV”
Name: “LR”
AntiSeoUpperBound: 1.0
Group: “Dynamic”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevancy. Factor remapping.”
Authors: [“aavdonkin”, “gulin”, “leshch”, “melkov”]
Responsibles: [“aavdonkin”, “gulin”, “melkov”]
}
Factor {
Index: 3
CppName: “FI_PAGE_RANK_BONUS”
Name: “PrBonus”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/PageRankBonus”
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: “Priority bonus, priority 7 – text priority. The factor is binary, has a value of 0 for all one-word requests, and a value of 1 for almost all two or more word requests, except for a very small number of answers for which there is not a single link that passed the quorum, and the text also did not pass the quorum.”
Authors: [“gulin”, “leo”]
Responsibles: “pavelgur”
}
Factor {
Index: 4
CppName: “FI_TEXT_RELEV_ALL_WORDS”
Name: “TRp1”
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: “TR’s strict precedence is text priority – there are all query words somewhere in the document (while they pass query context restrictions, for example, both words should be in the same sentence).”
Authors: [“denplusplus”, “gulin”, “leo”]
Responsibles: [“alsafr”, “gulin”, “leo”]
}
Factor {
Index: 5
CppName: “FI_TEXT_RELEV_PHRASE”
Name: “TRp2”
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: “The phrase priority for TR is text priority – there are all query words in a row in the document.”
Authors: [“denplusplus”, “gulin”, “leo”]
Responsibles: [“alsafr”, “gulin”, “leo”]
}
Factor {
Index: 6
CppName: “FI_LINK_RELEV_ALL_WORDS”
Name: “LRp1”
Group: “Dynamic”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “(strict) have all query words in one link.”
Authors: [“gulin”, “leo”]
Responsibles: [“gulin”, “leo”]
}
Factor {
Index: 7
CppName: “FI_LINK_RELEV_PHRASE”
Name: “LRp2”
Group: “Dynamic”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “(phrase) has all query words in a row in one link.”
Authors: [“gulin”, “leo”]
Responsibles: [“gulin”, “leo”]
}
Factor {
Index: 8
CppName: “FI_TEXT_RELEV_TITLE”
Name: “TRtitle”
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: “The presence of the exact phrase (query text) in the title (more precisely, in the first sentence of the document). Contextual restrictions and stop words are taken into account exactly as in TRp2, i.e. factor[8] is bounded above by factor[5]”
Authors: [“denplusplus”, “gulin”, “leo”]
Responsibles: [“alsafr”, “gulin”, “leo”]
}
Factor {
Index: 9
CppName: “FI_TEXT_RELEV_WHOLE_HR_MATCHED”
Name: “TRhr”
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: “Met a segment that passed a quorum in which all postings are designated as having relevance BEST_RELEV (title or meta keywords).”
Authors: [“gulin”, “leo”]
Responsibles: [“gulin”, “leo”]
}
# TODO(FACTORDEL-65): replace with TG_REMOVED
Factor {
Index: 10
CppName: “FI_REMOVED_10”
Name: “Removed_10”
Tags: [TG_UNUSED]
}
Factor {
Index: 11
CppName: “FI_NEWS”
Name: “News”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-3”
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “This is news (determined by characteristic ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-3 patterns in the url))).”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 12
CppName: “FI_SHOP”
Name: “Shop”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-4”
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “This is a store offer (determined by the characteristic ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-4 patterns in the url))). Not used (deprecated)”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 13
CppName: “FI_CATALOG”
Name: “Cat”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-2”
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “This is a directory (determined by characteristic ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-2 patterns in url)) or by Yandex – directory).”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 14
CppName: “FI_YA_BAR”
Name: “YaBar”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YaBar”
Tags: [TG_BROWSER, TG_HOST, TG_STATIC, TG_USER, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_USERFEAT]
Description: “Attendance from Bar – ((http://wiki.yandex-team.ru/AndrejjKostjagin/YaBarLog/HostStat Data Description)). Factor is remapping.”
Authors: [“kostyagin”, “somov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 15
CppName: “FI_LONG”
Name: “Long”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Long document (the longer the document, the greater the value of the factor).”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 16
CppName: “FI_HIT_WEIGHT”
Name: “TRhitw”
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: “Hitweight is a variant of text relevance in which the weights of all hits are considered equal (i.e., they do not take into account premiums for title and word proximity). At the same time, the corresponding hits must pass the restrictions of the syntactic wizard, i.e. we can assume that the TRhitw factor is 0 if and only if SoftAndOk is 0”
Authors: [“gulin”, “leo”]
Responsibles: [“gulin”, “leo”]
}
Factor {
Index: 17
CppName: “FI_LONG_QUERY”
Name: “LongQuery”
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: “The sum of idf query words. The name does not reflect the essence: for example, for the query ‘Gadyach’ this factor will be greater than for the query ‘Moscow Peter Yekaterinburg Samara’.”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 18
CppName: “FI_PURE_TEXT”
Name: “PureText”
Tags: [TG_BINARY, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/LongText”
Description: “Long text without links.”
Authors: “leo”
Responsibles: [“tsimkha”, “leo”]
}
Factor {
Index: 19
CppName: “FI_ROOT”
Name: “Root”
AntiSeoUpperBound: 1.0
Tags: [TG_BINARY, TG_DOC, TG_STATIC, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Root”
Description: “This is the site’s main page (root).”
Authors: “gulin”
Responsibles: [“gulin”, “tsimkha”]
}
# TODO(FACTORDEL-97): replace with TG_REMOVED, TG_REUSABLE and remove old formulas
Factor {
Index: 20
CppName: “FI_REMOVED_20”
Name: “Removed20”
Tags: [TG_UNUSED]
}
# TODO(FACTORDEL-97): replace with TG_REMOVED, TG_REUSABLE and remove old formulas
Factor {
Index: 21
CppName: “FI_REMOVED_21”
Name: “Removed21”
Tags: [TG_UNUSED]
}
Factor {
Index: 22
CppName: “FI_GEO”
Name: “Geo”
Tags: [TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_HOST, TG_BINARY, TG_DEPRECATED, TG_UNDOCUMENTED, TG_OFTEN_ZERO]
Description: “Means the match between the user’s region and the site at the country level. Binary factor: 1-matches, 0-no. Based on )”
Authors: [“ark-kum”, “gulin”, “maslov”]
Responsibles: [“ark-kum”, “gulin”, “maslov”]
}
Factor {
Index: 23
CppName: “FI_SUBQUERY_THEME_MATCH”
Name: “SubqueryThMatch”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Coincidence of the thematic spectrums of the query and the document. The subject of the query is the result of the work ((http://wiki.yandex-team.ru/EvgenijjKroxalev/subquery SubquerySearch sorcerer’s rules)) The subject of the document is taken from the Yandex catalog”
Authors: [“abokov”, “ekrokhalev”, “gulin”]
Responsibles: [“gulin”, “lamo”]
}
Factor {
Index: 24
CppName: “FI_SR”
Name: “SR”
Tags: [TG_DOC, TG_STATIC, TG_TRANS, TG_UNDOCUMENTED, TG_UNUSED]
Description: “Complex static rank, assembled from static components using a separate formula ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/#oftnd1 *)).”
Authors: [“gulin”, “somov”]
Responsibles: [“gulin”, “somov”]
}
Factor {
Index: 25
CppName: “FI_REFINES”
Name: “TRref”
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “A factor about the number of refines. The query language has a ‘user refines’ feature (a word preceded by a percent sign). As planned, this means something like ‘it would be nice if this word were in the document’. The only valuable use of this feature known to ((http://staff.yandex-team.ru/gulin Andrey Gulin)) is the request [% official % site Company Name]. This feature is unknown to users, because it is not described in any documentation. It is possible that it will disappear from the query language, but words with the USER_REFINE priority will remain in the wizard. The factor indicates the maximum number of USER_REFINE words that were simultaneously encountered within a single hit in the quorum. The count is taken to be from 0 to 3 (if > 3, it is treated as 3). This number maps to the half-interval [0,1)”
Authors: [“gulin”, “leo”]
Responsibles: [“gulin”, “leo”]
}
Factor {
Index: 26
CppName: “FI_TR_BOOST”
Name: “TRboost”
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The number by which some link factors are multiplied (namely, factors number 6, 7, 47, 66) if the text relevance is 0 and there are few links”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 27
CppName: “FI_TRLR_LEMMA”
Name: “TRLRlemma”
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Lemma match occurred in text relevance.”
Authors: [“gulin”, “leo”]
Responsibles: [“gulin”, “leo”]
}
Factor {
Index: 28
CppName: “FI_TRAFGRAPH_OUT_ALL_SHARE_D”
Name: “TrafgraphOutAll_share_d”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: “Remapped mascot feature TrafgraphOutAll_share_d”
Ticket: “SEARCHSPAM-15531”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “sdormidontov”]
ImplementationTime: “2020-09-30”
}
Factor {
Index: 29
CppName: “FI_RELEV_SENTS_DSSM”
Name: “RelevSentsDssm”
Tags: [TG_DYNAMIC, TG_DOC, TG_DOC_TEXT, TG_NEURAL, TG_NN_OVER_FEATURES_USE]
Description: “Dssm model, trained on reformulations, uses sentences relevant to the query in the document part”
UseArtifact: {Name: “DssmRelevSents”}
Ticket: “FACTOR-2259”
Authors: [“padese”]
Responsibles: [“padese”]
ImplementationTime: “2020-03-03”
}
Factor {
Index: 30
CppName: “FI_FRESH_NEWS_DETECTOR_PREDICT”
Name: “FreshNewsDetectorPredict”
Ticket: “WEBFRESH-478”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_FRESHNESS_USE, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_UNUSED, TG_NOT_01]
Description: “The value of the news detector calculated in the behemoth. Always 0 if the detector value is less than the threshold.”
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
MinValue: -3e+38
MaxValue: 3e+38
ImplementationTime: “2020-09-27”
}
Factor {
Index: 31
CppName: “FI_HIT_NUM_100”
Name: “LRHitNum100”
Group: “LegacyLR”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “The converted number of query words in all url links.”
Authors: “leshch”
Responsibles: “alsafr”
}
Factor {
Index: 32
CppName: “FI_HIT_NUM_GT_16”
Name: “LRHitNumGt16”
Group: “LegacyLR”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Document has LR>20 number of occurrences of query words in links > 16, pro LR factor.”
Authors: “leshch”
Responsibles: “alsafr”
}
Factor {
Index: 33
CppName: “FI_PCT_LINKS”
Name: “PctLinks”
Group: “LegacyLR”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “For documents with high LR – normalized link relevance without proximity, for documents with low LR 0”
Authors: “leshch”
Responsibles: “alsafr”
}
Factor {
Index: 34
CppName: “FI_HAS_LR”
Name: “HasLR”
Group: “LegacyLR”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “Url high LR.”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 35
CppName: “FI_LINK_QUALITY”
Name: “LinkQuality”
Tags: [TG_DOC, TG_LINK_TEXT, TG_STATIC, TG_DEPRECATED, TG_L2]
Description: “Inbound link quality (Leschiner classifier) – broken, see [405]”
Authors: “leshch”
Responsibles: “alsafr”
}
Factor {
Index: 36
CppName: “FI_ALICE_MUSIC_TRACK_TITLE_COSINE_MATCH_MAX_PREDICTION”
Name: “AliceMusicTrackTitleCosineMatchMaxPrediction”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “CosineMatchMaxPrediction factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 37
CppName: “FI_NUM_LINKS”
Name: “NumLinks”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NumLinks”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_L2, TG_UNUSED]
Description: “Number of incoming links. Remapping.”
Responsibles: [“tsimkha”, “alsafr”]
}
Factor {
Index: 38
CppName: “FI_POPULAR_Q”
Name: “PopularQ”
DependsOn: [{Feature: [“PopularQ”], Slice: “begemot_query_factors”}]
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_L2, TG_DEPRECATED]
Group: “Query”
Description: “Query Popularity”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/PopularQ”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 39
CppName: “FI_TR_UNMAPPED”
Name: “TRUnmapped”
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “TR divided by the cube of the number of words in the query and converted by the standard remapTR.”
Authors: [“denplusplus”, “gulin”]
Responsibles: [“alsafr”, “gulin”]
}
Factor {
Index: 40
CppName: “FI_RUS_LANG”
Name: “Ruslang”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document language is Russian.”
Authors: [“aalekseev”, “denplusplus”]
Responsibles: “alsafr”
}
Factor {
Index: 41
CppName: “FI_ADD_TIME”
Name: “AddTime”
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The time the page was added, greater is the older document; root the time mapped to the interval [0,1] so that 3+ years is 1.”
Authors: [“aalekseev”, “denplusplus”]
Responsibles: “alsafr”
}
Factor {
Index: 42
CppName: “FI_IS_MAIN_PAGE”
Name: “IsMainPage”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “If the main page of the owner (most often a second-level domain, for example xxxx.ru), then the factor is 1. For homeless people, hosting, personal blogs, etc. (for example, lifejournal, narod.ru, etc.) – third-level domains (such as xxxxx.narod.ru) will also have a factor of 1.”
Authors: [“aalekseev”, “denplusplus”]
Responsibles: “alsafr”
}
Factor {
Index: 43
CppName: “FI_ADD_TIME_MP”
Name: “AddTimeMP”
AntiSeoUpperBound: 1.0
Tags: [TG_DATE, TG_HOST, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The time of adding the main page of the owner (host?), remaps the same as AddTime.”
Authors: [“aalekseev”, “denplusplus”]
Responsibles: “alsafr”
}
Factor {
Index: 44
CppName: “FI_ALICE_MUSIC_TRACK_TITLE_ANNOTATION_MAX_VALUE_WEIGHTED”
Name: “AliceMusicTrackTitleAnnotationMaxValueWeighted”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “AnnotationMaxValueWeighted factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 45
CppName: “FI_URL_CLICKS_PCTR”
Name: “QueryURLClicksPCTR”
AntiSeoUpperBound: 0.6
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “How often a given URL is clicked for a given query – CTR multiplied by a correction factor”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: [“akhropov”, “solar”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 46
CppName: “FI_TEXT_BM25”
Name: “TextBM25”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Simple BM25 by text.”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 47
CppName: “FI_LINK_BM25”
Name: “LinkBM25”
Group: [“LinkBM25”, “Dynamic”]
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Simple BM25 by links, link weights are not taken into account.”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 48
CppName: “FI_TLBM25”
Name: “TLBM25”
Group: “TextAndLinkBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “A simple BM25 for text and links at the same time.”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 49
CppName: “FI_TLP1”
Name: “TLp1”
Group: “TextAndLinkBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “All query words are in the text + links.”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 50
CppName: “FI_ADV”
Name: “Adv”
Tags: [TG_OWNER, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “There are ads on the site.”
Authors: [“aalekseev”, “denplusplus”]
Responsibles: [“sisoid”, “alsafr”]
}
Factor {
Index: 51
CppName: “FI_YANDEX_ADV”
Name: “YandexAdv”
AntiSeoUpperBound: 1.0
Tags: [TG_OWNER, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “There are Yandex ads on the site.”
Authors: [“aalekseev”, “denplusplus”]
Responsibles: [“sisoid”, “alsafr”]
}
Factor {
Index: 52
CppName: “FI_NO_SPAM”
Name: “NoSpam”
AntiSeoUpperBound: 1.0
Tags: [TG_OWNER, TG_STATIC, TG_THEME_CLASSIF, TG_REARR_USE, TG_DEPRECATED]
Description: “Spam classifier by antispam features recognized the site as NOT(!) spam. I.e. 0=spam, 1=good.”
Authors: [“aalekseev”, “denplusplus”]
Responsibles: “alsafr”
}
Factor {
Index: 53
CppName: “FI_TEXT_PAIR”
Name: “TxtPair”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Simple BM25 by word pairs – we take all pairs of query words and count the number of their occurrences in the document text. Use the sum of word weights as the weight of the pair. Comment: does not work if the query contains a stop word”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 54
CppName: “FI_LINK_PAIR”
Name: “LnkPair”
Group: “LinkBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Same as TxtPair, but for links; link weights are not taken into account.”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 55
CppName: “FI_TEXT_BREAK”
Name: “TxtBreak”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “BM25 of the number of sentences in the document in which it occurs.”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 56
CppName: “FI_TEXT_HEAD”
Name: “TxtHead”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “BM25 according to title only.”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 57
CppName: “FI_TEXT_HI_RELEV”
Name: “TxtHiRel”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “BM25 words only with high rel beats (‘significant’, emphasis (etp)).”
Authors: “gulin”
Responsibles: “gulin”
}
# TODO(FACTORDEL-97): replace with TG_REMOVED, TG_REUSABLE and remove old formulas
Factor {
Index: 58
CppName: “FI_REMOVED_58”
Name: “Removed_58”
Tags: [TG_UNUSED]
}
Factor {
Index: 59
CppName: “FI_WORD_COUNT”
Name: “WordCount”
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Min(number of query words/10, 1.f)”
Authors: [“denplusplus”, “gulin”]
Responsibles: [“alsafr”, “gulin”]
}
Factor {
Index: 60
CppName: “FI_INV_WORD_COUNT”
Name: “InvWordCount”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “1 / number_of_words_in_query.”
Authors: [“denplusplus”, “gulin”]
Responsibles: [“alsafr”, “gulin”]
}
Factor {
Index: 61
CppName: “FI_HAS_NO_TR”
Name: “HasNoTR”
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: “Document has no TR.”
Authors: [“denplusplus”, “gulin”]
Responsibles: [“alsafr”, “gulin”]
CanonicalValue: 1.0
}
Factor {
Index: 62
CppName: “FI_HAS_NO_LR”
Name: “HasNoLR”
Group: “LegacyLR”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “Document has no LR.”
Authors: [“denplusplus”, “gulin”]
Responsibles: [“gulin”, “alsafr”]
CanonicalValue: 1.0
}
Factor {
Index: 63
CppName: “FI_HAS_NO_QUERY_URL_SHOWS”
Name: “HasNoQueryURLShows”
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “There is no click-through information for this url for this request 1 – request or request-url is not in the click base, 0 – request-url is in the click base”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#hasnoqueryurldownershows”
Authors: [“denplusplus”, “kostyagin”]
Responsibles: [“tarum”, “niknik”]
CanonicalValue: 1.0
}
Factor {
Index: 64
CppName: “FI_HAS_NO_QUERY_SHOWS”
Name: “HasNoQueryShows”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “There is no click-through information for this request 1 – the request is not in the click base, 0 – the request is in the click base.”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#hasnoqueryshows”
Authors: [“denplusplus”, “kostyagin”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
CanonicalValue: 1.0
}
Factor {
Index: 65
CppName: “FI_HOPS”
Name: “Hops”
Tags: [TG_DOC, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Number of link hops needed to reach the url from the main page: the closer to the main page, the smaller the value (0 – the main page, 1 – can’t be reached from the main page, 0 < can be reached from the main page < 1). The normal value for the root main page is 0.0039.”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 66
CppName: “FI_LOG_LR”
Name: “LogLR”
AntiSeoUpperBound: 0.85
Group: “Dynamic”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “Logarithm of LR mapped linearly to [0,1].”
Authors: [“denplusplus”, “karpik”]
Responsibles: “alsafr”
}
Factor {
Index: 67
CppName: “FI_TEXT_PAIR_EX”
Name: “TxtPairEx”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the presence of pairs of words in the exact form”
Responsibles: “alsafr”
}
Factor {
Index: 68
CppName: “FI_TEXT_BREAK_EX”
Name: “TxtBreakEx”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the number of sentences containing many words in the exact form”
Responsibles: “alsafr”
}
Factor {
Index: 69
CppName: “FI_TEXT_HEAD_EX”
Name: “TxtHeadEx”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the presence of words in the title in the exact form”
Responsibles: “alsafr”
}
Factor {
Index: 70
CppName: “FI_TEXT_HI_RELEV_EX”
Name: “TxtHiRelEx”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “BM25 in exact shape”
Responsibles: “alsafr”
}
Factor {
Index: 71
CppName: “FI_TEXT_BM25_EX”
Name: “TxtBm25Ex”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “A simple BM25 in precise shape.”
Responsibles: “alsafr”
}
Factor {
Index: 72
CppName: “FI_TEXT_PAIR_SYN”
Name: “TxtPairSy”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the presence of pairs of words, taking into account synonyms (>=TxtPair)”
Responsibles: “alsafr”
}
Factor {
Index: 73
CppName: “FI_TEXT_BRAEK_SYN”
Name: “TxtBreakSy”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the number of sentences in which there are many words, taking into account synonyms”
Responsibles: “alsafr”
}
Factor {
Index: 74
CppName: “FI_TEXT_HEAD_SYN”
Name: “TxtHeadSy”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: “the presence of words in the title, taking into account synonyms”
Responsibles: “alsafr”
}
Factor {
Index: 75
CppName: “FI_TEXT_HI_RELEV_SYN”
Name: “TxtHiRelSy”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “BM25 with synonyms”
Responsibles: “alsafr”
}
Factor {
Index: 76
CppName: “FI_TEXT_BM25_SYN”
Name: “TxtBm25Sy”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “A simple BM25 with synonyms.”
Responsibles: “alsafr”
}
Factor {
Index: 77
CppName: “FI_QUERY_DOWNER_CLICKS_PCTR”
Name: “QueryDownerClicksPCTR”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “How often the URLs of the given domainId are clicked on for the given request – CTR of the domainId multiplied by the correction factor”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: [“akhropov”, “solar”, “denplusplus”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 78
CppName: “FI_HAS_NO_QUERY_DOWNER_SHOWS”
Name: “HasNoQueryDownerShows”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “There is no clickability information for this domainId for this request 1 – request or request-owner is not in the click base, 0 – request-owner is in the click base”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#hasnoqueryurldownershows”
Authors: [“denplusplus”, “kostyagin”]
Responsibles: [“tarum”, “niknik”]
CanonicalValue: 1.0
}
Factor {
Index: 79
CppName: “FI_OWNER_CLICKS_PCTR”
Name: “OwnerClicksPCTR”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_2EPD4]
Description: “Clickability of the owner regardless of the request”
Wiki: “http://wiki.yandex-team.ru/YandexSearch/SearchQuality/Clicks#ownerclickspctrreg”
Authors: [“akhropov”, “maslov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 80
CppName: “FI_MEGAFON”
Name: “Megafon”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_UNUSED]
Description: “The relative frequency of query words in links (1 – query words are often found in links, 0.3 – rarely); more precisely, the value of this factor is pessimized under the condition: TR=0 && LR=0 && (there is no link with all the words query) && (quorum not passed) && (at least one pair of query words occurs in the text)”
Responsibles: “alsafr”
}
Factor {
Index: 81
CppName: “FI_HAS_ALL_WORDS_MERGED”
Name: “XLRp0”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “The links contain all the words of the query”
Responsibles: “alsafr”
}
Factor {
Index: 82
CppName: “FI_HAS_ALL_WORDS_IN_LINK”
Name: “XLRp1”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “One link has all the words of the query”
Responsibles: “alsafr”
}
Factor {
Index: 83
CppName: “FI_PHRASE”
Name: “XLRp2”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “There is a link that has passed quorum”
Responsibles: “alsafr”
}
Factor {
Index: 84
CppName: “FI_GOOD_RATIO”
Name: “XLRgood”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “What proportion of links are ‘good’”
Responsibles: “alsafr”
}
Factor {
Index: 85
CppName: “FI_MANY_BAD”
Name: “XLRmanyBad”
AntiSeoUpperBound: 1.0
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “How many bad links (bad = dpr = 0)”
Responsibles: “alsafr”
}
Factor {
Index: 86
CppName: “FI_LR_MAX_DPR”
Name: “XLRmaxDpr”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “Max link dpr”
Responsibles: “alsafr”
}
Factor {
Index: 87
CppName: “FI_LR_TF_IDF”
Name: “XLRtfidf”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “TfIdf regular TF*IDF by links. Word frequency in links is multiplied by the inverse document frequency and summed over all words, then normalized to the length of the document.”
Responsibles: “alsafr”
}
Factor {
Index: 88
CppName: “FI_LR_RELEV”
Name: “XLRrelev”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-2”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance from Gulin”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 89
CppName: “FI_LR_RELEV_200”
Name: “XLRrelev200”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance from Gulin”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 90
CppName: “FI_LR_LOG_RELEV”
Name: “XLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance from Gulin”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 91
CppName: “FI_BF_EXACT”
Name: “BFexact”
Group: “BestForm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “There is an exact form of all query words in text/links”
Responsibles: “alsafr”
}
Factor {
Index: 92
CppName: “FI_BF_LEMMA”
Name: “BFlemma”
Group: “BestForm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “There is a lemma of all query words in text/links”
Responsibles: “alsafr”
}
Factor {
Index: 93
CppName: “FI_SOFT_AND_OK”
Name: “SoftAndOk”
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Document passed softand against syntax wizard restrictions. Only for documents that have text relevance. Always 1 for single-word queries.”
Responsibles: “alsafr”
}
Factor {
Index: 94
CppName: “FI_NEW_LINK_QUALITY”
Name: “NewLinkQuality”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_DEPRECATED]
Description: “Inbound link quality classifier 2 – broken, see [407]”
Responsibles: “alsafr”
}
Factor {
Index: 95
CppName: “FI_UKR”
Name: “Ukrainian”
Tags: [TG_STATIC_REGINFO, TG_HOST, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “equals to one if the site has a Ukrainian geo-attribute (i.e. 1 – Ukrainian site)”
Responsibles: “alsafr”
}
Factor {
Index: 96
CppName: “FI_IS_BLOG”
Name: “Isblog”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Klassificacionnye?v=tkd#h45859-5”
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Page from blog hosting”
Authors: [“burmisha”, “zudina”]
Responsibles: [“burmisha”, “zudina”]
}
Factor {
Index: 97
CppName: “FI_IS_LJ”
Name: “IsLivejournal”
Tags: [TG_HOST, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Page from livejournal.com”
Responsibles: “alsafr”
}
# TODO(FACTORDEL-56): replace with TG_REMOVED
Factor {
Index: 98
CppName: “FI_REMOVED_98”
Name: “Removed_98”
Tags: [TG_UNUSED]
}
Factor {
Index: 99
CppName: “FI_SPAM2”
Name: “Spam2”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-3”
Tags: [TG_OWNER, TG_STATIC, TG_THEME_CLASSIF, TG_DEPRECATED]
Description: “Alekseev’s automatic spam classifier, the probability that the site is spam (0 is not spam, 1 is spam)”
Authors: “abv”
Responsibles: “abv”
}
Factor {
Index: 100
CppName: “FI_TEXT_FEATURES”
Name: “TextFeatures”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The quality of the text. It is calculated according to a rather complex formula”
Responsibles: “alsafr”
}
Factor {
Index: 101
CppName: “FI_TEXT_LIKE”
Name: “TextLike”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Text quality (Alekseev classifier)”
Responsibles: “alsafr”
}
# TODO(FACTORDEL-56): replace with TG_REMOVED
Factor {
Index: 102
CppName: “FI_REMOVED_102”
Name: “Removed_102”
Tags: [TG_UNUSED]
}
# TODO(FACTORDEL-56): replace with TG_REMOVED
Factor {
Index: 103
CppName: “FI_REMOVED_103”
Name: “Removed_103”
Tags: [TG_UNUSED]
}
Factor {
Index: 104
CppName: “FI_YABAR_CORE_OWNER”
Name: “YaBarCoreOwner”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “The core of the audience of owners according to Yandex.Browsing”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/coreaudience/”
Authors: “monster”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 105
CppName: “FI_YABAR_CORE_HOST”
Name: “YaBarCoreHost”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “The core audience of hosts according to Yandex.Browser data”
Authors: “kostyagin”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/coreaudience/”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 106
CppName: “FI_HAS_YA_BAR_CORE”
Name: “HasYaBarCore”
AntiSeoUpperBound: 1.0
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Whether the host has a core audience”
Authors: “kostyagin”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/coreaudience/”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 107
CppName: “FI_SPAM_KARMA”
Name: “SpamKarma”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-4”
Tags: [TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “Anti-spammer name spam karma – probability that host is spam; based on whois information”
Authors: “abv”
Responsibles: “abv”
}
Factor {
Index: 108
CppName: “FI_MUSIC_Q”
Name: “MusicQ”
DependsOn: [{Feature: [“MusicQ”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Musicality of the query. The output of Anton Konygin’s wizard.”
Responsibles: “alsafr”
UseArtifact: {Name: “MusicWizardClassificator”}
}
Factor {
Index: 109
CppName: “FI_EXACT_MATCHES”
Name: “XLExactMatches”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “number of links that exactly matched the query”
Responsibles: “alsafr”
}
Factor {
Index: 110
CppName: “FI_DOC_LEN”
Name: “Doclen”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document length in sentences”
Responsibles: “alsafr”
}
Factor {
Index: 111
CppName: “FI_URL_LEN”
Name: “UrlLen”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “URL length divided by 5”
Responsibles: “alsafr”
}
Factor {
Index: 112
CppName: “FI_QUERY_NON_COMMERCIALITY”
Name: “QueryNonCommerciality”
DependsOn: [{Feature: [“QueryNonCommerciality”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_COMMERCIAL, TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Commerciality of a query from a phrase dictionary from Yandex.Direct: 0 – maximum commerciality, 1 – minimum.”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryNonCommerciality”
Ticket: “SEARCHSPAM-7504”
Authors: “somov”
Responsibles: [“sisoid”, “anelyubin”]
}
Factor {
Index: 113
CppName: “FI_HOST_SIZE”
Name: “HostSize”
AntiSeoUpperBound: 1.0
Tags: [TG_HOST, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Host size (by Raskovalov) in documents, without removing duplicates (each duplicate is counted in the factor as a separate document)”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 114
CppName: “FI_IS_HTML”
Name: “IsHTML”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document Type – HTML”
Responsibles: “alsafr”
}
Factor {
Index: 115
CppName: “FI_LINK_SPEED”
Name: “LinkSpeed”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-4”
Group: “Xref”
Tags: [TG_DATE, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “The reciprocal of the variance of the times of occurrence of links with query words”
Responsibles: “alsafr”
}
Factor {
Index: 116
CppName: “FI_TH_LR_RELEV”
Name: “XThLRrelev”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-5”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance based on topics”
Responsibles: “alsafr”
}
Factor {
Index: 117
CppName: “FI_TH_LR_RELEV_200”
Name: “XThLRrelev200”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance based on topics”
Responsibles: “alsafr”
}
Factor {
Index: 118
CppName: “FI_TH_LR_LOG_RELEV”
Name: “XThLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance based on topics”
Responsibles: “alsafr”
}
Factor {
Index: 119
CppName: “FI_LERF_LR_RELEV”
Name: “XLerfLRrelev”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-8”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance based on the quality of each link”
Responsibles: “alsafr”
}
Factor {
Index: 120
CppName: “FI_LERF_LR_RELEV_200”
Name: “XLerfLRrelev200”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance based on the quality of each link”
Responsibles: “alsafr”
}
Factor {
Index: 121
CppName: “FI_LERF_LR_LOG_RELEV”
Name: “XLerfLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance based on the quality of each link”
Responsibles: “alsafr”
}
Factor {
Index: 122
CppName: “FI_LERF_TH_LR_LOG_RELEV”
Name: “XLerfThLRlogRelev”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-11”
Group: “Xref”
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance based on the quality of each link and the topic of each link”
Responsibles: “alsafr”
}
Factor {
Index: 123
CppName: “FI_NON_COMM_LR_LOG_RELEV”
Name: “XNonCommLRlogRelev”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-12”
Group: “Xref”
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance considering the non-commercial nature of each link”
Responsibles: “alsafr”
}
Factor {
Index: 124
CppName: “FI_NON_COMM_TH_LR_LOG_RELEV”
Name: “XNonCommThLRlogRelev”
AntiSeoUpperBound: 1.0
Group: “Xref”
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance taking into account the non-commercial nature of each link and subject matter”
Responsibles: “alsafr”
}
Factor {
Index: 125
CppName: “FI_NON_COMM_LERF_LR_LOG_RELEV”
Name: “XNonCommLerfLRlogRelev”
AntiSeoUpperBound: 1.0
Group: “Xref”
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance considering the non-commercial nature of each link and the quality of each link”
Responsibles: “alsafr”
}
Factor {
Index: 126
CppName: “FI_NON_COMM_LERF_TH_LR_LOG_RELEV”
Name: “XNonCommLerfThLRlogRelev”
AntiSeoUpperBound: 1.0
Group: “Xref”
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance based on the non-commercial nature of each link, the quality of each link and the topicality”
Responsibles: “alsafr”
}
Factor {
Index: 127
CppName: “FI_GEO_CITY_PROXIM”
Name: “GeoCityProxim”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_GEOINQUERY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Means the match of the region mentioned in the request and the sites found at the region level. Binary factor: 1-matches, 0-no. Based on ((http://wiki.yandex-team.ru/YandexPoisk/ClassificationSitesAndPages/Geographic/ UseInSearch for Geoclassification of Sites))”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 128
CppName: “FI_LINKS_WITH_WORDS_PERCENT”
Name: “LinksWithWordsPercent”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_UNUSED]
Description: “Percentage of incoming links with query words”
Responsibles: “alsafr”
}
Factor {
Index: 129
CppName: “FI_LINKS_WITH_ALL_WORDS_PERCENT”
Name: “LinksWithAllWordsPercent”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_UNUSED]
Description: “Percentage of inbound links with all query words”
Responsibles: “alsafr”
}
Factor {
Index: 130
CppName: “FI_PORNO_QUERY”
Name: “PornoQuery”
DependsOn: [{Feature: [“PornoQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Does the query contain words from yweb/pornofilter/porno.query.”
Wiki: “http://wiki.yandex-team.ru//h.yandex.net/?https%3A%2F%2Ftree.yandex.ru%2Fcgi-bin%2Fcvsweb.cgi%2Farcadia%2Fyweb%2Fpornofilter%2Fporno.query”
Responsibles: “alsafr”
UseArtifact: {Name: “PornoQueryList”}
}
Factor {
Index: 131
CppName: “FI_IS_PORNO”
Name: “Isporno”
AntiSeoUpperBound: 1.0
Ticket: “BETATEST-151”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “porn gut document”
Responsibles: “abv”
}
Factor {
Index: 132
CppName: “FI_IS_COMM”
Name: “IsComm”
AntiSeoUpperBound: 1.0
Ticket: “BETATEST-151”
Tags: [TG_COMMERCIAL, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: “document from commercial-intestine. Not used (deprecated)”
Comment: “Still used in formula and polynomial :(”
Responsibles: “sisoid”
}
Factor {
Index: 133
CppName: “FI_IS_FAKE”
Name: “IsFake”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “fake document”
Responsibles: “alsafr”
}
Factor {
Index: 134
CppName: “FI_IS_SEO”
Name: “IsSEO”
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: “page title contains commercial language. Not used (deprecated)”
Responsibles: “alsafr”
}
Factor {
Index: 135
CppName: “FI_IS_WIKI”
Name: “IsWiki”
AntiSeoUpperBound: 1.0
Tags: [TG_HOST, TG_STATIC, TG_WIKIPEDIA, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “page from en.wikipedia.org”
Responsibles: “alsafr”
}
Factor {
Index: 136
CppName: “FI_IS_ESHOP”
Name: “IsEShop”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “commercial page (Savin classifier)”
Authors: “asavin”
Responsibles: “asavin”
}
Factor {
Index: 137
CppName: “FI_GEO_REGION_PROXIM”
Name: “GeoRegionProxim”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_GEOINQUERY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 138
CppName: “FI_HAS_NO_ALL_WORDS_TR_SYN”
Name: “HasNoAllWordsTRSy”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the document does not contain all the words of the query (up to a synonym)”
Responsibles: “alsafr”
CanonicalValue: 1.0
}
Factor {
Index: 139
CppName: “FI_NUM_WORDS_TR_SYN”
Name: “NumWordsTRSy”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “percentage of query words in the document (up to a synonym)”
Responsibles: “alsafr”
}
Factor {
Index: 140
CppName: “FI_HAS_ALL_WORDS_TR_SYN”
Name: “HasAllWordsTRSY”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the document contains all the words of the query (up to a synonym)”
Responsibles: “alsafr”
}
Factor {
Index: 141
CppName: “FI_NUM_WORDS_LR”
Name: “NumWordsLR”
Group: “LinkBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “percentage of query words in links (up to a synonym)”
Responsibles: “alsafr”
}
Factor {
Index: 142
CppName: “FI_HAS_ALL_WORDS_LR”
Name: “HasAllWordsLR”
Group: “LinkBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “the links contain all the words of the query (up to the synonym)”
Responsibles: “alsafr”
}
Factor {
Index: 143
CppName: “FI_PAY_DETECTOR_PREDICT”
Name: “PayDetectorPredict”
Ticket: “COMMERCIAL-4”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: “The value of the commerce detector calculated in Begemot.”
MinValue: -10
MaxValue: 10
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
ImplementationTime: “2020-08-01”
}
Factor {
Index: 144
CppName: “FI_TEXT_INV_PAIR”
Name: “TxtInvPair”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “TR through query word pairs in reverse order”
Responsibles: “alsafr”
}
Factor {
Index: 145
CppName: “FI_LINK_INV_PAIR”
Name: “LnkInvPair”
Group: “LinkBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “LR on pairs of query words in reverse order”
Responsibles: “alsafr”
}
Factor {
Index: 146
CppName: “FI_TEXT_SKIP_PAIR”
Name: “TxtSkipPair”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “TR by pairs of query words through one word in texts”
Responsibles: “alsafr”
}
Factor {
Index: 147
CppName: “FI_LINK_SKIP_PAIR”
Name: “LnkSkipPair”
Group: “LinkBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “LR by query word pairs through one word in texts”
Responsibles: “alsafr”
}
Factor {
Index: 148
CppName: “FI_NUM_WORDS_TRFM”
Name: “NumWordsTRFm”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “percentage of all query words in the text (accurate to form)”
Responsibles: “alsafr”
}
Factor {
Index: 149
CppName: “FI_HAS_ALL_WORDS_TRFM”
Name: “HasAllWordsTRFm”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the document contains all the words of the query (up to the form)”
Responsibles: “alsafr”
}
Factor {
Index: 150
CppName: “FI_Q_DIVERSITY”
Name: “QDiversity”
DependsOn: [{Feature: [“QDiversity”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “The degree of centralization of the points from which the request is made”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QDiversity”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 151
CppName: “FI_Q_BLOG”
Name: “QBlog”
DependsOn: [{Feature: [“QBlog”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Does the query contain blog vocabulary”
Responsibles: “alsafr”
}
Factor {
Index: 152
CppName: “FI_GEO_LR_LOG_RELEV”
Name: “XGeoLRlogRelev”
AntiSeoUpperBound: 0.9
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “log(LR, narrowed down to the user’s country)”
Responsibles: “alsafr”
}
Factor {
Index: 153
CppName: “FI_LERF_GEO_LR_LOG_RELEV”
Name: “XLerfGeoLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “log(LerfLR, narrowed down to user’s country)”
Responsibles: “alsafr”
}
Factor {
Index: 154
CppName: “FI_NON_COMMERCIAL_QUERY”
Name: “NonCommercialQuery”
DependsOn: [{Feature: [“NonCommercialQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_COMMERCIAL, TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Binary non-commerciality of the query: QueryNonCommerciality > 0.965.”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryNonCommerciality”
Ticket: “SEARCHSPAM-7504”
Responsibles: [“sisoid”, “anelyubin”]
}
Factor {
Index: 155
CppName: “FI_EXACT_MATCHES_MAP”
Name: “XLExactMatchesMap”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “Number of links matching query text (another remap)”
Responsibles: “alsafr”
}
Factor {
Index: 156
CppName: “FI_LERF_NORM_LR_LOG_RELEV”
Name: “XLerfNormLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “XLerfLRlogRelev (normalized to the sum of the Lerf weights of all links, not the sum of their original weights)”
Responsibles: “alsafr”
}
Factor {
Index: 157
CppName: “FI_NON_COMM_NORM_LR_LOG_RELEV”
Name: “XNonCommNormLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “XNonCommLRlogRelev (normalized to the sum of the NonComm weights of all links, not the sum of their original weights)”
Responsibles: “alsafr”
}
Factor {
Index: 158
CppName: “FI_NON_COMM_TH_NORM_LR_LOG_RELEV”
Name: “XNonCommThNormLRlogRelev”
Group: “Xref”
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance taking into account the non-commercial nature of each link and subject matter”
Responsibles: “alsafr”
}
Factor {
Index: 159
CppName: “FI_NON_COMM_LERF_NORM_LR_LOG_RELEV”
Name: “XNonCommLerfNormLRlogRelev”
Group: “Xref”
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “XNonCommLerfNormLRlogRelev (normalized to the sum of the NonCommLerf weights of all links, not the sum of their original weights)”
Responsibles: “alsafr”
}
Factor {
Index: 160
CppName: “FI_NON_COMM_LERF_TH_NORM_LR_LOG_RELEV”
Name: “XNonCommLerfThNormLRlogRelev”
Group: “Xref”
Tags: [TG_COMMERCIAL, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevance based on the non-commercial nature of each link, the quality of each link and the topicality”
Responsibles: “alsafr”
}
Factor {
Index: 161
CppName: “FI_NEVASCA1”
Name: “Nevasca1”
Tags: [TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “Not used. Content duplication. Host ‘goodness’ (from 0 to 1) calculated based on how many and which hosts are borrowing content from this host.”
Authors: “antonovvk”
Responsibles: “antonovvk”
}
Factor {
Index: 162
CppName: “FI_NEVASCA2”
Name: “Nevasca2”
Tags: [TG_OWNER, TG_STATIC, TG_DEPRECATED]
Description: “Not used. Content duplication. Host ‘Badness’ (0 to 1) is proportional to the amount of secondary content on the host.”
Authors: “antonovvk”
Responsibles: “antonovvk”
}
Factor {
Index: 163
CppName: “FI_LINK_AGE”
Name: “LinkAge”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Average age of links that contributed something to LR. LinkAge = Min(log(average link age)/7, 1), 3 years taken as 1”
Responsibles: “alsafr”
}
Factor {
Index: 164
CppName: “FI_TLEN”
Name: “TLen”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Length of page text in words TLen = Map(number of words, 1/400), where Map(x, y) = x*y / (1 + x*y)”
Responsibles: “alsafr”
}
Factor {
Index: 165
CppName: “FI_IS_UNREACHABLE”
Name: “IsUnreachable”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The page is unreachable by links from the home page.”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 166
CppName: “FI_LANG_LR_LOG_RELEV”
Name: “XLangLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “LR considering matching language of link and query”
Responsibles: “alsafr”
}
Factor {
Index: 167
CppName: “FI_LERF_LANG_LR_LOG_RELEV”
Name: “XLerfLangLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “LR, taking into account the coincidence of the language of the link and the request, and cheating”
Responsibles: “alsafr”
}
Factor {
Index: 168
CppName: “FI_QUERY_URL_CLICKS_FRC”
Name: “QueryURLClicksFRC”
AntiSeoUpperBound: 0.3
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “the ratio of the number of clicks on this URL to all clicks on the query”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: [“lidia”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 169
CppName: “FI_QUERY_DOWNER_CLICKS_FRC”
Name: “QueryDownerClicksFRC”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “the ratio of the number of clicks on the given domainId to all clicks on the query”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: [“lidia”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 170
CppName: “FI_QUERY_URL_CLICKS_PCTR_COPY”
Name: “QueryURLClicksPCTR_copy”
AntiSeoUpperBound: 0.42
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_DEPRECATED, TG_L2]
Countries: CNT_RELEV
Description: “[Bug: Factor copy 45] How often a given URL is clicked on for a given query – CTR multiplied by a correction factor”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: [“akhropov”, “solar”]
Responsibles: [“akhropov”, “diver”]
}
Factor {
Index: 171
CppName: “FI_DOPP_URL_SESSION_CLICKS_FRC_CITY”
Name: “DoppQueryUrlSessionClicksFRCCity”
Ticket: “FACTOR-311”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DoppQueryUrlSessionClicksFRC”
Tags: [TG_USER, TG_USER_SEARCH, TG_DYNAMIC, TG_DOC, TG_LOCALIZED_CITY, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_L2, TG_REARR_USE, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “What part (average per session) of clicks on this request with the user’s city of urls added to it is this url. Calculated by user sessions.”
Authors: “esoloviev”
Responsibles: [“esoloviev”, “kolesov93”, “tarum”, “niknik”]
}
Factor {
Index: 172
CppName: “FI_QUERY_URL_CLICKS_PCTR_REG”
Name: “QueryURLClicksPCTR_Reg”
AntiSeoUpperBound: 0.4
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “How often this URL is clicked for this query – CTR multiplied by the correction factor, by small regions from relev_regions.web.txt”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 173
CppName: “FI_QUERY_DOWNER_CLICKS_PCTR_REG”
Name: “QueryDOwnerClicksPCTR_Reg”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “How often the URLs of the given domainId are clicked for the given request – CTR of the domainId multiplied by the correction factor, by small regions from relev_regions.web.txt”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 174
CppName: “FI_QUERY_URL_CLICKS_FRC_REG”
Name: “QueryURLClicksFRC_Reg”
AntiSeoUpperBound: 0.25
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “the ratio of the number of clicks on this URL to all clicks on the request, by small regions from relev_regions.web.txt”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 175
CppName: “FI_QUERY_DOWNER_CLICKS_FRC_REG”
Name: “QueryDOwnerClicksFRC_Reg”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “the ratio of the number of clicks on the given domainId to all clicks on the request, in small regions from relev_regions.web.txt”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 176
CppName: “FI_QUERY_URL_CLICKS_COMBO_REG”
Name: “QueryURLClicksCombo_Reg”
AntiSeoUpperBound: 0.5
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Query URL Clicks Combo, by small regions from relev_regions.web.txt”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 177
CppName: “FI_QUERY_DOWNER_CLICKS_COMBO_REG”
Name: “QueryDownerClicksCombo_Reg”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Query DOwner Clicks Combo, by small regions from relev_regions.web.txt”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 178
CppName: “FI_CATALOG_RELEV”
Name: “XLRCatalogRelev”
AntiSeoUpperBound: 1.0
Group: “Xref”
Tags: [TG_CATALOG, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “LR by catalog descriptions”
Responsibles: “alsafr”
}
Factor {
Index: 179
CppName: “FI_YA_CATALOG_RELEV”
Name: “XLRYaCatalogRelev”
Group: “Xref”
Tags: [TG_CATALOG, TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “LR by descriptions in Yandex.Catalog”
Responsibles: “alsafr”
}
Factor {
Index: 180
CppName: “FI_EXACT_WORD_ORDER_LEN”
Name: “ExactWordOrderLen”
Group: “CombinedSequences”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The length of the maximum match of forms in the text and query”
Authors: “pzuev”
Responsibles: “pzuev”
}
Factor {
Index: 181
CppName: “FI_EXACT_WORD_ORDER_WEIGHT”
Name: “ExactWordOrderWeight”
Group: “CombinedSequences”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The weight of the maximum match of forms in the text and query”
Authors: “pzuev”
Responsibles: “pzuev”
}
Factor {
Index: 182
CppName: “FI_WORD_ORDER_LEN”
Name: “WordOrderLen”
Group: “CombinedSequences”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The length of the maximum match by lemma in the text and query”
Authors: “pzuev”
Responsibles: “pzuev”
}
Factor {
Index: 183
CppName: “FI_WORD_ORDER_WEIGHT”
Name: “WordOrderWeight”
Group: “CombinedSequences”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The weight of the maximum match by lemma in the text and query”
Authors: “pzuev”
Responsibles: “pzuev”
}
Factor {
Index: 184
CppName: “FI_LINK_MAX_AGE”
Name: “LinkMaxAge”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “Maximum age of a significant collection of links that contributed something to LR”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 185
CppName: “FI_TEXT_RELEV_ALL_WORDS_WITH_STOPS”
Name: “TRp1All”
AntiSeoUpperBound: 1.0
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
Description: “Variants of the relevance factors that take stop words into account”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 186
CppName: “FI_LINK_RELEV_ALL_WORDS_WITH_STOPS”
Name: “LRp1All”
AntiSeoUpperBound: 1.0
Group: “LegacyLR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Variants of the relevance factors that take stop words into account”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 187
CppName: “FI_TLP1_ALL”
Name: “TLp1All”
Group: “TextAndLinkBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: “Variants of the relevance factors that take stop words into account”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 188
CppName: “FI_BF_EXACT_ALL”
Name: “BFexactAll”
Group: “BestForm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Description: “Variants of the relevance factors that take stop words into account”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 189
CppName: “FI_BF_LEMMA_ALL”
Name: “BFlemmaAll”
Group: “BestForm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Description: “Variants of the relevance factors that take stop words into account”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 190
CppName: “FI_PASSAGE_LEGACY_TR”
Name: “PassageLegacyTR”
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “TR of the best passage – how high-quality the snippet can be”
Responsibles: “alsafr”
}
Factor {
Index: 191
CppName: “FI_TEXT_BM25_ATTEN_SYN”
Name: “TxtBM25AttenSyn”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “TR with a discount based on sentence number”
Authors: “pzuev”
Responsibles: “pzuev”
}
Factor {
Index: 192
CppName: “FI_MAX_WORD_HOST_RANK”
Name: “MaxWordHostRank”
Group: “domain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LINK_TEXT, TG_LINK_GRAPH, TG_DEPRECATED]
Description: “Host rank for the most expressed query word (usually the site name)”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/PWR”
Authors: “finder”
Responsibles: “akhropov”
}
Factor {
Index: 193
CppName: “FI_MAX_WORD_HOST_CLICKS”
Name: “MaxWordHostClicks”
Group: “domain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED]
Description: “Clickability of domAttr by the maximum expressed word. For example, for all queries that contain the word wikipedia, they click on wikipedia pages.”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC”
Authors: “finder”
Responsibles: “akhropov”
}
Factor {
Index: 194
CppName: “FI_DOM_PHRASE_RANK”
Name: “DomPhraseRank”
Group: “domain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LINK_TEXT, TG_LINK_GRAPH, TG_DEPRECATED]
Description: “HostRank for single words”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/PWR”
Authors: “finder”
Responsibles: “akhropov”
}
Factor {
Index: 195
CppName: “FI_DOM_PHRASE_CLICK_RANK”
Name: “DomPhraseClickRank”
Group: “domain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED]
Description: “Domain CTR by words”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC”
Authors: “finder”
Responsibles: “akhropov”
}
Factor {
Index: 196
CppName: “FI_IS_FORUM”
Name: “IsForum”
Ticket: [“BUKI-1543”, “SEARCHSPAM-3650”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsForum”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “URL matches the FORUM_DETECTOR regex”
Authors: “zudina”
Responsibles: “zudina”
}
Factor {
Index: 197
CppName: “FI_ALICE_MUSIC_TRACK_TITLE_ANNOTATION_MATCH_WEIGHTED_VALUE”
Name: “AliceMusicTrackTitleAnnotationMatchWeightedValue”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “AnnotationMatchWeightedValue factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 198
CppName: “FI_IS_OBSOLETE”
Name: “IsObsolete”
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The URL contains an old date (used to recognize outdated news). The factor is 1 if the URL contains a year <=2007.”
Authors: “finder”
Responsibles: “finder”
}
Factor {
Index: 199
CppName: “FI_TR_WITH_STOPS”
Name: “TRWithStops”
AntiSeoUpperBound: 1.0
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The weight of the maximum match of forms in the text and query”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 200
CppName: “FI_LR_WITH_STOPS”
Name: “LRWithStops”
AntiSeoUpperBound: 1.0
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_UNUSED]
Description: “The weight of the maximum match of forms in the text and query”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 201
CppName: “FI_HAS_PAYMENTS”
Name: “Payments”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The page contains information about ‘payment for SMS’.”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 202
CppName: “FI_IS_LINK_PESSIMISED”
Name: “IsLinkPessimised”
Tags: [TG_OWNER, TG_STATIC, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “Anti-spammers pessimized the site – all dynamic link factors are reset. zerolnk.flt”
Authors: “zudina”
Responsibles: “zudina”
}
Factor {
Index: 203
CppName: “FI_ESHOP_VALUE”
Name: “EshopValue”
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Online shop page”
Authors: “asavin”
Responsibles: “asavin”
}
Factor {
Index: 204
CppName: “FI_PORNO_VALUE”
Name: “PornoValue”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Pornographic page”
Authors: “asavin”
Responsibles: “asavin”
}
Factor {
Index: 205
CppName: “FI_TRAFGRAPH_OUT_ALL_SHARE_M”
Name: “TrafgraphOutAll_share_m”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: “Remapped mascot feature TrafgraphOutAll_share_m”
Ticket: “SEARCHSPAM-15531”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “sdormidontov”]
ImplementationTime: “2020-09-30”
}
Factor {
Index: 206
CppName: “FI_TRAFGRAPH_OUT_ALL_SE_SHARE_D”
Name: “TrafgraphOutAllSE_share_d”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: “Remapped mascot feature TrafgraphOutAllSE_share_d”
Ticket: “SEARCHSPAM-15531”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “sdormidontov”]
ImplementationTime: “2020-09-30”
}
Factor {
Index: 207
CppName: “FI_TRAFGRAPH_OUT_ALL_SE_SHARE_M”
Name: “TrafgraphOutAllSE_share_m”
Ticket: “SEARCHSPAM-15531”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “sdormidontov”]
Description: “Remapped mascot feature TrafgraphOutAllSE_share_m”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED],
}
Factor {
Index: 208
CppName: “FI_NO_EXT_CLICKS_SHARE”
Name: “NoExtClicksShare”
Ticket: “SEARCHSPAM-15531”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “sdormidontov”]
Description: “Remapped mascot feature NoExtClicksShare”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED],
}
Factor {
Index: 209
CppName: “FI_COUNTERS_SEARCH_TRAFFIC1”
Name: “CountersSearchTraffic1”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/usercounteractions/Simple”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_COUNTER, TG_UNUSED, TG_L2]
Description: “Search traffic – clicks from search engines to the site (2nd formula)”
Authors: [“amotuzov”, “denplusplus”]
Responsibles: “smikler”
}
Factor {
Index: 210
CppName: “FI_COUNTERS_SEARCH_TRAFFIC2”
Name: “CountersSearchTraffic2”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/usercounteractions/Simple”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_COUNTER, TG_UNUSED, TG_L2]
Description: “Search traffic – clicks from search engines to the site (2nd formula)”
Authors: [“amotuzov”, “denplusplus”]
Responsibles: “smikler”
}
Factor {
Index: 211
CppName: “FI_DOM_PHRASE_YABAR”
Name: “DomPhraseYabar”
Group: “domain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED]
Description: “Click-throughs to the site from search engines for individual query words, according to Yandex.Bar data”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC”
Authors: “finder”
Responsibles: “akhropov”
}
Factor {
Index: 212
CppName: “FI_ALICE_MUSIC_ARTIST_NAME_BCLM_MIX_PLAIN_KE5”
Name: “AliceMusicArtistNameBclmMixPlainK000001”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALICE_MUSIC, TG_ALLOW_USE_FOR_ALICE]
Description: “BclmMixPlainK000001 factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 213
CppName: “FI_QUERY_URL_LCS”
Name: “QueryUrlLCS”
Tags: [TG_DYNAMIC, TG_DOC, TG_URL_TEXT, TG_L2, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlLCS”
Ticket: “FACTOR-417”
Description: “Largest common substring of url and query, normalized by url length”
Authors: [“mbusel”, “tsimkha”, “alsafr”]
Responsibles: [“mbusel”, “tsimkha”]
}
Factor {
Index: 214
CppName: “FI_ONLY_URL”
Name: “OnlyUrl”
Group: “UrlBM25”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/OnlyUrl”
Tags: [TG_DOC, TG_DYNAMIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “All matches are only in the URL, there are no matches in the text of the page”
Authors: “denplusplus”
Responsibles: [“alsafr”, “stash93”]
}
Factor {
Index: 215
CppName: “FI_GEO_RELEV_REGION_CITY”
Name: “GeoRelevRegionCity”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 216
CppName: “FI_GEO_RELEV_REGION_REGION”
Name: “GeoRelevRegionRegion”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 217
CppName: “FI_GEO_RELEV_REGION_COUNTRY”
Name: “GeoRelevRegionCountry”
AntiSeoUpperBound: 1.0
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L3_OVERWRITE, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Three levels of coincidence between the geography of the user and the page”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 218
CppName: “FI_LR_GEO_RELEV_REGION_CITY”
Name: “XLRGeoRelevRegionCity”
AntiSeoUpperBound: 1.0
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 219
CppName: “FI_LR_GEO_RELEV_REGION_REGION”
Name: “XLRGeoRelevRegionRegion”
AntiSeoUpperBound: 1.0
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 220
CppName: “FI_LR_GEO_RELEV_REGION_COUNTRY”
Name: “XLRGeoRelevRegionCountry”
AntiSeoUpperBound: 1.0
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_UNUSED]
Description: “Three levels of link region and query matching”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 221
CppName: “FI_GEO_COUNTRY_PROXIM”
Name: “GeoCountryProxim”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Geographic proximity”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 222
CppName: “FI_IS_NAV_QUERY”
Name: “IsNavQuery”
DependsOn: [{Feature: [“IsNavQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_NAV, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Description: “Is the query navigational based on the clickability of responses”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsNav”
Authors: [“akhropov”, “denplusplus”, “prs”]
Responsibles: [“tarum”, “niknik”]
UseArtifact: {Name: “IsNavTrie”}
}
Factor {
Index: 223
CppName: “FI_MAX_WORD_HOST_YABAR”
Name: “MaxWordHostYaBar”
Group: “domain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “The most characteristic query word corresponding to the site, according to Yandex.Bar data”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC”
Authors: “finder”
Responsibles: “akhropov”
}
Factor {
Index: 224
CppName: “FI_FIRST_WORD_HOST_CLICKS”
Name: “FirstWordHostClicks”
Group: “domain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “Clickability of the host by the first word of the query. Quite often the first (last) word of the query is an explicit indication of the site on which to search for information.”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat/WHC”
Authors: “finder”
Responsibles: “akhropov”
}
Factor {
Index: 225
CppName: “FI_ALICE_MUSIC_ARTIST_NAME_CMMATCH_TOP5_AVG_MATCH”
Name: “AliceMusicArtistNameCMMatchTop5AvgMatch”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “CMMatchTop5AvgMatch factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 226
CppName: “FI_QUERY_DOWNER_YABAR_VISITS”
Name: “QueryDownerYabarVisits”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 227
CppName: “FI_QUERY_DOWNER_YABAR_VISITORS”
Name: “QueryDownerYabarVisitors”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 228
CppName: “FI_QUERY_DOWNER_YABAR_AVG_TIME”
Name: “QueryDownerYabarAvgTime”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_REARR_USE, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Description: “Average, over users, of the continuous active time (in seconds) a user spends on the host’s pages after clicking through from a search engine for the query (the factor depends on the (query, domAttr) pair).”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 229
CppName: “FI_QUERY_DOWNER_YABAR_AVG_TIME2”
Name: “QueryDownerYabarAvgTime2”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Description: “Average, over users, of the continuous active time (in seconds) a user spends on the host’s pages after clicking through from a search engine for the query (the factor depends on the (query, domAttr) pair). Measured by the internal counter of Yandex.Bar/Elements/Browser”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 230
CppName: “FI_QUERY_DOWNER_YABAR_AVG_ACTIONS”
Name: “QueryDOwnerYabarAvgActions”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_REARR_USE, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_5, TG_DEPRECATED]
Description: “The average number of active actions (clicks, keystrokes) for users when the user is continuously on the host pages after clicking on a request from a search engine (the factor depends on the pair (request,domAttr)). By the internal counter of Yandex.Bar/Elements/Browser”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 231
CppName: “FI_QUERY_URL_YABAR_VISITS”
Name: “QueryUrlYabarVisits”
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_L2]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“akhropov”, “diver”]
}
Factor {
Index: 232
CppName: “FI_QUERY_URL_YABAR_VISITORS”
Name: “QueryUrlYabarVisitors”
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_REARR_USE, TG_DEPRECATED, TG_L2]
Description: “Number of unique visitors from search engines for a specific query”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“akhropov”, “diver”]
}
Factor {
Index: 233
CppName: “FI_QUERY_URL_YABAR_AVG_TIME”
Name: “QueryUrlYabarAvgTime”
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_L2]
Description: “Average, over users, of the continuous active time (in seconds) a user spends on the page after clicking through from a search engine for the query (the factor depends on the (query, url) pair).”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“akhropov”, “diver”]
}
Factor {
Index: 234
CppName: “FI_QUERY_URL_YABAR_AVG_TIME2”
Name: “QueryUrlYabarAvgTime2”
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_L2]
Description: “Average, over users, of the continuous active time (in seconds) a user spends on the page after clicking through from a search engine for the query (the factor depends on the (query, url) pair). Measured by the internal counter of Yandex.Bar/Elements/Browser”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“akhropov”, “diver”]
}
Factor {
Index: 235
CppName: “FI_QUERY_URL_YABAR_AVG_ACTIONS”
Name: “QueryUrlYabarAvgActions”
AntiSeoUpperBound: 1.0
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_L2]
Description: “Users average number of active actions (clicks, keystrokes) on the page after clicking on a query from a search engine (the factor depends on the pair (query, url))”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/”
Authors: “akhropov”
Responsibles: [“akhropov”, “diver”]
}
Factor {
Index: 236
CppName: “FI_DSSM_BERT_DISTILL_SINSIG_MSE_BASE_REG_CHAIN”
Name: “DssmBertDistillSinsigMseBaseRegChain”
Tags: [TG_REMOVED]
Description: “A pool of PRS logs is marked up using Bert trained on sinsig. A dssm model is trained on this pool using BaseRegionChain”
UseArtifact: {Name: “DssmBertDistillSinsigMseBaseRegChain”}
Ticket: “FACTOR-2287”
Authors: [“ivaninap”, “rmplstiltskin”]
Responsibles: [“ivaninap”, “rmplstiltskin”]
ImplementationTime: “2020-02-21”
}
Factor {
Index: 237
CppName: “FI_DSSM_BERT_DISTILL_RELEVANCE_MSE_BASE_REG_CHAIN”
Name: “DssmBertDistillRelevanceMseBaseRegChain”
Tags: [TG_REMOVED]
Description: “A pool of PRS logs is marked up using Bert trained for relevance. A dssm model is trained on this pool using BaseRegionChain”
UseArtifact: {Name: “DssmBertDistillRelevanceMseBaseRegChain”}
Ticket: “FACTOR-2287”
Authors: [“ivaninap”, “rmplstiltskin”]
Responsibles: [“ivaninap”, “rmplstiltskin”]
ImplementationTime: “2020-02-21”
}
Factor {
Index: 238
CppName: “FI_ALICE_MUSIC_ARTIST_NAME_PER_WORD_CM_MAX_MATCH_MIN”
Name: “AliceMusicArtistNamePerWordCMMaxMatchMin”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “PerWordCMMaxMatchMin factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 239
CppName: “FI_ALICE_MUSIC_ARTIST_NAME_ATTENV1_BM15_K05”
Name: “AliceMusicArtistNameAttenV1_Bm15_K05”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “AttenV1_Bm15_K05 factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 240
CppName: “FI_ALICE_MUSIC_ALBUM_TITLE_ANNOTATION_MAX_VALUE_WEIGHTED”
Name: “AliceMusicAlbumTitleAnnotationMaxValueWeighted”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “AnnotationMaxValueWeighted factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 241
CppName: “FI_IS_FOREIGN_QUERY”
Name: “IsForeignQuery”
DependsOn: [{Feature: [“IsForeignQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Request is not in Russian”
Authors: “denplusplus”
Responsibles: “alsafr”
UseArtifact: {Name: “QueryLang”}
}
Factor {
Index: 242
CppName: “FI_IS_FOREIGN_CLUSTER”
Name: “IsForeignCluster”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “document from a foreign cluster”
Responsibles: “alsafr”
}
Factor {
Index: 243
CppName: “FI_PAGE_REGION_SIZE_IN”
Name: “PageRegionSizeIn”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: “Page region size”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 244
CppName: “FI_PAGE_REGION_INV_SIZE_IN”
Name: “PageRegionInvSizeIn”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: “The factor is inversely proportional to the size of the page region”
Authors: “denplusplus”
Responsibles: “alsafr”
CanonicalValue: 1.0
}
Factor {
Index: 245
CppName: “FI_QUERY_REGION_SIZE”
Name: “QueryRegionSize”
Group: “Query”
Tags: [TG_DYNAMIC, TG_LOCALIZED_CITY, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Request region size”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 246
CppName: “FI_QUERY_REGION_INV_SIZE”
Name: “QueryRegionInvSize”
Group: “Query”
Tags: [TG_DYNAMIC, TG_LOCALIZED_CITY, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The factor is inversely proportional to the size of the request region”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 247
CppName: “FI_GEO_GEOMETRY_PROXIM”
Name: “GeoGeometryProxim”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: “Geographical proximity of the user and the site”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 248
CppName: “FI_RINGS_HOST_RANK_BADNESS_OLD”
Name: “RingsHostRankBadnessOld”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=181r#h58953-4”
Tags: [TG_OWNER, TG_STATIC, TG_DEPRECATED]
Description: “Characterizes the site’s promotion by link rings. The value is the share of external links that are included in link rings and link exchangers.”
Authors: [“denplusplus”, “raigorodsky”]
Responsibles: [“raigorodsky”, “alsafr”]
}
Factor {
Index: 249
CppName: “FI_YABAR_HOST_VISITORS”
Name: “YabarHostVisitors”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Number of unique visitors, remapped exponentially”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 250
CppName: “FI_YABAR_HOST_SEARCH_TRAFFIC”
Name: “YabarHostSearchTraffic”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Share of traffic from search engines”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 251
CppName: “FI_YABAR_HOST_INTERNAL_TRAFFIC”
Name: “YabarHostInternalTraffic”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “percentage of visits to the site not by links (typed by hand or from bookmarks)”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 252
CppName: “FI_YABAR_HOST_AVG_TIME”
Name: “YabarHostAvgTime”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_REARR_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Average active continuous time (in seconds) that a user spends on the host’s pages”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 253
CppName: “FI_YABAR_HOST_AVG_TIME2”
Name: “YabarHostAvgTime2”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_REARR_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Average active continuous time (in seconds) that a user spends on the pages of the host, according to the internal counter of Yandex.Bar/Elements/Browser”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/userbrowsingactions/#2008”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 254
CppName: “FI_YABAR_HOST_AVG_ACTIONS”
Name: “YabarHostAvgActions”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Average number of active user actions (clicks, keystrokes) while the user stays continuously on the host’s pages (time measured in seconds).”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 255
CppName: “FI_YABAR_HOST_BROWSE_RANK”
Name: “YabarHostBrowseRank”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_BROWSER_PAGE_RANK, TG_USERFEAT]
Description: “implementation of the algorithm described in the article ((http://wiki.yandex-team.ru//h.yandex.net/?http%3A%2F%2Fresearch.microsoft.com%2Fen-us%2Fpeople%2Ftyliu%2Ffp032-liu.pdf http://research.microsoft.com/en-us/people/tyliu/fp032-liu.pdf))”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 256
CppName: “FI_YABAR_URL_VISITS”
Name: “YabarUrlVisits”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “URL traffic according to Yandex.Bar”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 257
CppName: “FI_YABAR_URL_VISITORS”
Name: “YabarUrlVisitors”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Number of unique url visitors”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 258
CppName: “FI_YABAR_URL_AVG_TIME”
Name: “YabarUrlAvgTime”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Average user time spent on the page. Calculated as the difference between adjacent transitions.”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 259
CppName: “FI_OWNER_SATISFIED4_RATE”
Name: “OwnerSatisfied4Rate”
Ticket: “BUKI-955”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/OwnerSatisfied4Rate”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEPRECATED]
Description: “This is the SEA factor = s4_r/ (k_r+10) where s4_r is the number of clicks > 180 sec, k_r is the total number of clicks. Calculated with reformulations.”
Authors: [“popescul”, “cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 260
CppName: “FI_OWNER_SATISFIED4_RATE_REG”
Name: “OwnerSatisfied4Rate_Reg”
Ticket: “BUKI-955”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/OwnerSatisfied4Rate”
Group: “RegHostStatic”
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEPRECATED]
Countries: CNT_RELEV
Description: “This is the SEA factor = s4_r/ (k_r+10) where s4_r is the number of clicks > 180 sec, k_r is the total number of clicks. Calculated with reformulations. Localized version”
Authors: [“popescul”, “cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 261
CppName: “FI_URL_QUERY_VARIETY”
Name: “UrlQueryVariety”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Degree of variety of the queries for which this URL is clicked”
Wiki: “https://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Kliki#urlqueryvarietyreg”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 262
CppName: “FI_IS_COMM_BY_KEYWORDS”
Name: “IsCommByKeywords”
Tags: [TG_STATIC, TG_DEPRECATED]
Description: “The page is commercial based on keywords. Not used (deprecated)”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 263
CppName: “FI_DOC_TFIDF_SUM”
Name: “DocIdfSum_broken”
Tags: [TG_STATIC, TG_DEPRECATED, TG_L2]
Description: “Idf for various parts of the document, broken, not used”
Authors: “melton”
Responsibles: “melton”
}
Factor {
Index: 264
CppName: “FI_TITLE_IDF_SUM”
Name: “TitleIdfSum_broken”
Tags: [TG_STATIC, TG_DEPRECATED, TG_L2]
Description: “Idf for various parts of the document, broken, not used”
Authors: “melton”
Responsibles: “melton”
}
Factor {
Index: 265
CppName: “FI_HEADING_IDF_SUM”
Name: “HeadingIdfSum_broken”
Tags: [TG_STATIC, TG_DEPRECATED, TG_L2]
Description: “Idf for various parts of the document, broken, not used”
Authors: “melton”
Responsibles: “melton”
}
Factor {
Index: 266
CppName: “FI_NORMAL_TEXT_IDF_SUM”
Name: “NormalTextIdfSum_broken”
Tags: [TG_STATIC, TG_DEPRECATED, TG_L2]
Description: “Idf for various parts of the document, broken, not used”
Authors: “melton”
Responsibles: “melton”
}
Factor {
Index: 267
CppName: “FI_LR_VIDEO_RELEV”
Name: “XLRVideoRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “Link factor about the presence of a video on the page.”
Authors: “vnik”
Responsibles: “vnik”
}
Factor {
Index: 268
CppName: “FI_AUX_TEXT_BM25”
Name: “AuxTextBM25”
AntiSeoUpperBound: 0.8
Group: “AuxBM25”
Tags: [TG_DOC_TEXT, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “BM25 by user region for localizable requests, for non-localizable requests in KUB – country. The texts of requests sent for regions can be viewed in relev_regions.txt in the sorcerer”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 269
CppName: “FI_AUX_LINK_BM25”
Name: “AuxLinkBM25”
AntiSeoUpperBound: 0.8
Group: “AuxBM25”
Tags: [TG_DYNAMIC, TG_LOCALIZED_CITY, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Same for link relevancy”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 270
CppName: “FI_COMM_LINKS_SEO_HOSTS”
Name: “CommLinksSEOHosts”
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “The share of incoming sales links. An algorithm for recognizing commercial links has been implemented. The factor is remapped to [0,1] if the share of such links is > 50%, otherwise 0. ((http://wiki.yandex-team.ru/SvetlanaShorina/topseolinks a selection of cheated sites))”
Authors: “kvn”
Responsibles: “sisoid”
}
Factor {
Index: 271
CppName: “FI_COMM_LINKS_SEO_HOSTS_PORNO_QUERY”
Name: “CommLinksSEOHostsPornoQuery”
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_LINK_GRAPH, TG_OWNER, TG_DYNAMIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: “Previous factor multiplied by PornoQuery”
Authors: “kvn”
Responsibles: “sisoid”
}
Factor {
Index: 272
CppName: “FI_COMM_LINKS_SEO_HOSTS_NON_COMM”
Name: “CommLinksSEOHostsNonComm”
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_LINK_GRAPH, TG_OWNER, TG_DYNAMIC, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “CommLinksSEOHosts factor multiplied by NonCommercialQuery”
Authors: “kvn”
Responsibles: “sisoid”
}
Factor {
Index: 273
CppName: “FI_TOVAR_CATEGORY_QUERY”
Name: “ProductCategoryQuery”
DependsOn: [{Feature: [“ProductCategoryQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: “The request mentions a product category. Not used (deprecated)”
Responsibles: “alsafr”
}
Factor {
Index: 274
CppName: “FI_TOVAR_VENDOR_QUERY”
Name: “ProductCategoryVendor”
DependsOn: [{Feature: [“ProductCategoryVendor”], Slice: “begemot_query_factors”}]
Group: “Query”
AntiSeoUpperBound: 1.0
Tags: [TG_COMMERCIAL, TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: “Vendor mentioned in request. Not used (deprecated)”
Responsibles: “alsafr”
}
Factor {
Index: 275
CppName: “FI_Q_DIVERSITY2”
Name: “Diversity2”
DependsOn: [{Feature: [“Diversity2”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Description: “Geographic distribution of the request”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Diversity2”
Authors: “denplusplus”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 276
CppName: “FI_NIGHT_QUERY”
Name: “NightQuery”
DependsOn: [{Feature: [“NightQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Request is made mostly at night”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 277
CppName: “FI_MORNING_QUERY”
Name: “MorningQuery”
DependsOn: [{Feature: [“MorningQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “The request is usually asked in the morning”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 278
CppName: “FI_DAY_QUERY”
Name: “DayQuery”
DependsOn: [{Feature: [“DayQuery”], Slice: “begemot_query_factors”}]
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_REARR_USE, TG_L2, TG_DEPRECATED]
Group: “Query”
Description: “Request is made mostly during the day”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 279
CppName: “FI_EVENING_QUERY”
Name: “EveningQuery”
DependsOn: [{Feature: [“EveningQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Request is asked mostly in the evening”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 280
CppName: “FI_HOUR_DIVERSITY”
Name: “HourDiversity”
DependsOn: [{Feature: [“HourDiversity”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Description: “Degree of expressiveness of setting requests at different times of the day”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity”
Authors: “denplusplus”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 281
CppName: “FI_LCOR”
Name: “LCor”
Group: “Dynamic”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “Characterizes the frequency of words in links. The factor is large if the word that contributed to link relevance is rare in links.”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 282
CppName: “FI_SUBQUERY_THEME_MATCH_A”
Name: “SubqueryThMatchA”
Tags: [TG_DOC, TG_DYNAMIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Match between the thematic spectra of the query and the document. The topic of the query is the output of the ((http://wiki.yandex-team.ru/EvgenijjKroxalev/subquery SubquerySearch sorcerer’s rules)). The topic of the document is determined by an automatic classifier”
Authors: [“ekrokhalev”, “pyal”]
Responsibles: [“pyal”, “lamo”]
}
Factor {
Index: 283
CppName: “FI_TR_DOCQUORUM”
Name: “TRDocQuorum”
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “The weight of the query words that are in the text”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 284
CppName: “FI_LR_DOCQUORUM”
Name: “LRDocQuorum”
Group: “Dynamic”
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_UNUSED, TG_DEPRECATED]
Description: “The weight of the query words that are in the links”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 285
CppName: “FI_TRLR_DOCQUORUM”
Name: “TRLRDocQuorum”
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “The weight of the query words that are in the text and links”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 286
CppName: “FI_OWNER_SDIFF_CLICK_ENTROPY”
Name: “OwnerSDiffClickEntropy”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Entropy – click distribution”
Wiki: “http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick”
Authors: [“cliff”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 287
CppName: “FI_OWNER_SDIFF_SHOW_ENTROPY”
Name: “OwnerSDiffShowEntropy”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Entropy – distribution of impressions”
Wiki: “http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick”
Authors: [“cliff”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 288
CppName: “FI_OWNER_SDIFF_CSRATIO_ENTROPY”
Name: “OwnerSDiffCSRatioEntropy”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Entropy – click/impression ratio distribution”
Wiki: “http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick”
Authors: [“cliff”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 289
CppName: “FI_PORNO_LR_LOG_RELEV”
Name: “XPornoLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Document porn by link text”
Authors: “somov”
Responsibles: “somov”
}
Factor {
Index: 290
CppName: “FI_PORNO_NORM_LR_LOG_RELEV”
Name: “XPornoNormLRlogRelev”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Document porn by link text, different normalization”
Responsibles: “alsafr”
}
Factor {
Index: 291
CppName: “FI_XPORNO_QUERY”
Name: “XPornoQuery”
DependsOn: [{Feature: [“XPornoQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Porn query classifier, different dictionary than PornoQuery”
Responsibles: “alsafr”
UseArtifact: {Name: “PornoQueryList”}
}
Factor {
Index: 292
CppName: “FI_ALICE_MUSIC_ALBUM_TITLE_ATTENV1_BM15_K05”
Name: “AliceMusicAlbumTitleAttenV1_Bm15_K05”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “AttenV1_Bm15_K05 factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 293
CppName: “FI_GEO_COUNTRY_COUNTRY_PROXIM”
Name: “GeoCountryCountryProxim”
Tags: [TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_HOST, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Geographic proximity of the country of the site and the country of the request”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 294
CppName: “FI_URL_DOMAIN_FRACTION”
Name: “UrlDomainFraction”
Group: “Dynamic”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlTrigramFraction”
Tags: [TG_HOST, TG_DYNAMIC, TG_URL_TEXT, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: “Coverage of the domain by trigrams from the query. (Example: [Chelyabinsk lottery] – chelloto. We transliterate the query, find the trigrams that are covered (che, hel, lot, olo), and compute what percentage of all the trigrams is covered.)”
Authors: [“cliff”, “melton”]
Responsibles: [“tsimkha”, “melton”]
}
Factor {
Index: 295
CppName: “FI_URL_PATH_AND_PARAMS_FRACTION”
Name: “UrlPathAndParamsFraction”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlTrigramFraction”
Tags: [TG_DOC, TG_DYNAMIC, TG_URL_TEXT, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: “Same as the previous factor, but for the entire url except for the domain”
Responsibles: [“tsimkha”, “alsafr”]
}
Factor {
Index: 296
CppName: “FI_SPECIFICAL_QUERY”
Name: “SpecificQuery”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The request is locally specific. The request is often reformulated with an explicit region specification. ((https://ml.yandex-team.ru/archive/thread1433892/#message1433892 more))”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 297
CppName: “FI_JOKER_LEN”
Name: “JokerLen”
Ticket: “BUKI-705”
Group: “CombinedSequences”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: “We compute text features assuming that the title of the page is attached to each of its sentences, i.e. the distance between a word from the title and any other word is 1 sentence. Len is the maximum, over the sentences of the text (with the title), of the ratio of the number of query words found in the sentence to the length of the query. Example: [Kharms Circus Vertunov] for ((http://wiki.yandex-team.ru//h.yandex.net/?http%3A%2F%2Fwww.wikilivres.info%2Fwiki%2F%25D0%25A6%25D0%25B8%25D1%2580%25D0%25BA_%25D0%25A8%25D0%25B0%25D1%2580%25D0%25B4%25D0%25B0%25D0%25BC_%28%25D0%25A5%25D0%25B0%25D1%2580%25D0%25BC%25D1%2581%29 this document))”
Authors: “styskin”
Responsibles: “styskin”
}
Factor {
Index: 298
CppName: “FI_JOKER_WEIGHT”
Name: “JokerWeight”
Group: “CombinedSequences”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: “The ratio of the sum idf of the words found in the sentence+title to all the words.”
Responsibles: “alsafr”
}
Factor {
Index: 299
CppName: “FI_EXACT_JOKER_LEN”
Name: “ExactJokerLen”
Group: “CombinedSequences”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: “Same as JokerLen, in exact forms”
Responsibles: “alsafr”
}
Factor {
Index: 300
CppName: “FI_EXACT_JOKER_WEIGHT”
Name: “ExactJokerWeight”
Group: “CombinedSequences”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: “Same as JokerWeight, in exact forms”
Responsibles: “alsafr”
}
Factor {
Index: 301
CppName: “FI_MORE_120_SEC_VISITS_NOT_SEARCH_SHARE”
Name: “More120SecVisitsNotSearchShare”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: “Remapped mascot feature More120SecVisitsNotSearchShare”
Ticket: “SEARCHSPAM-15531”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “sdormidontov”]
ImplementationTime: “2020-09-30”
}
Factor {
Index: 302
CppName: “FI_LINK_BREAK”
Name: “LnkBreak”
Group: “LinkBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Analogues of the corresponding text factors for links. BM25 of the number of links in which a match occurred.”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 303
CppName: “FI_LINK_BM25_EX”
Name: “LnkBm25Ex”
Group: [“LinkBM25”, “Dynamic”]
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Simple BM25 in exact form in link texts”
Responsibles: “alsafr”
}
Factor {
Index: 304
CppName: “FI_LINK_PAIR_SYN”
Name: “LnkPairSy”
Group: “LinkBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “The presence of pairs of words in links, taking into account synonyms”
Responsibles: “alsafr”
}
Factor {
Index: 305
CppName: “FI_LINK_BREAK_SYN”
Name: “LnkBrkSy”
Group: “LinkBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Number of links that passed the threshold”
Responsibles: “alsafr”
}
Factor {
Index: 306
CppName: “FI_LINK_BM25_SYN”
Name: “LnkBm25Sy”
Group: [“LinkBM25”, “Dynamic”]
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Simple BM25 on links with synonyms”
Responsibles: “alsafr”
}
Factor {
Index: 307
CppName: “FI_IS_VIDEO_QUERY”
Name: “VideoQuery”
DependsOn: [{Feature: [“VideoQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Video request”
Responsibles: “alsafr”
}
Factor {
Index: 308
CppName: “FI_OWNER_CLICKS_PCTR_REG”
Name: “OwnerClicksPCTR_Reg”
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Group: “RegHostStatic”
Description: “Click-through rate of the owner regardless of the request, separately by region”
Wiki: “http://wiki.yandex-team.ru/YandexSearch/SearchQuality/Clicks#ownerclickspctrreg”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 309
CppName: “FI_OWNER_SDIFF_CLICK_ENTROPY_REG”
Name: “OwnerSDiffClickEntropy_Reg”
Group: “RegHostStatic”
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “Entropy – click distribution. Regionalized”
Wiki: “http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 310
CppName: “FI_OWNER_SDIFF_SHOW_ENTROPY_REG”
Name: “OwnerSDiffShowEntropy_Reg”
Group: “RegHostStatic”
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “Entropy – impression distribution. Regionalized”
Wiki: “http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 311
CppName: “FI_OWNER_SDIFF_CSRATIO_ENTROPY_REG”
Name: “OwnerSDiffCSRatioEntropy_Reg”
Group: “RegHostStatic”
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “Entropy – click/impression ratio distribution. Regionalized”
Wiki: “http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/OwnerClick”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 312
CppName: “FI_ADULTNESS”
Name: “Adultness”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: “equals 2 * NastyContent”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Adultness”
Authors: “melton”
Responsibles: “snow”
}
Factor {
Index: 313
CppName: “FI_HOST_ADULTNESS”
Name: “HostAdultness”
Tags: [TG_HOST, TG_STATIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: “equals 2 * NastyContent”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HostAdultness”
Responsibles: “snow”
}
Factor {
Index: 314
CppName: “FI_KC_HOST_ADULTNESS”
Name: “KCHostAdultness”
Tags: [TG_HOST, TG_STATIC, TG_THEME_CLASSIF, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “always zero”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/KCHostAdultness”
Responsibles: “snow”
}
Factor {
Index: 315
CppName: “FI_IS_COM”
Name: “IsCom”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/DomainZone”
Tags: [TG_HOST, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Domain in zone .com”
Authors: “somov”
Responsibles: [“tsimkha”, “alsafr”]
}
Factor {
Index: 316
CppName: “FI_IS_UA”
Name: “IsUa”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/DomainZone”
Tags: [TG_HOST, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Domain in .ua zone”
Authors: “somov”
Responsibles: [“tsimkha”, “alsafr”]
}
Factor {
Index: 317
CppName: “FI_IS_NOT_RU”
Name: “IsNotRu”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/DomainZone”
Tags: [TG_HOST, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The domain is not in the .ru zone”
Authors: “somov”
Responsibles: [“tsimkha”, “alsafr”]
}
Factor {
Index: 318
CppName: “FI_LR_MARKET_RELEV”
Name: “XLRMarketRelev”
AntiSeoUpperBound: 1.0
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “LR by links from Yandex.Market”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 319
CppName: “FI_POETRY”
Name: “Poetry”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-18”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document poetry”
Authors: “vnik”
Responsibles: “vnik”
}
Factor {
Index: 320
CppName: “FI_POETRY_QUAD”
Name: “PoetryQuad”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#h20931-18”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Maximum versification of a quatrain”
Authors: “vnik”
Responsibles: “vnik”
}
Factor {
Index: 321
CppName: “FI_ENG_LANG”
Name: “EngLang”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document language is English”
Responsibles: “alsafr”
}
Factor {
Index: 322
CppName: “FI_DOC_HAS_TWO_EXACT_QUERY_PARTS”
Name: “Has2ExactQueryParts”
Group: “ExactGroups”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The query is completely covered by two exact match groups consisting of exact match query words in a row ((http://wiki.yandex-team.ru/poiskovajaplatforma/tr/CoverageByGroups About group coverage))”
Authors: [“finder”, “gruntova”]
Responsibles: “finder”
}
Factor {
Index: 323
CppName: “FI_DOC_HAS_LEVENSHT1_QUERY_FRAGMENT”
Name: “HasLevensht1QueryFragment”
Group: “ExactGroups”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “There is a group of exact match query words covering the query (possibly with a word omitted, added or replaced)”
Authors: [“finder”, “gruntova”]
Responsibles: “finder”
}
Factor {
Index: 324
CppName: “FI_LARGEST_SY_INEXACT_GROUP”
Name: “LargestSyInexactGroup”
Group: “ExactGroups”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Proportion of the query covered by the longest group of any hits (including word forms and synonyms). Possibly with skipping, adding or replacing a word”
Authors: [“finder”, “gruntova”]
Responsibles: “finder”
}
Factor {
Index: 325
CppName: “FI_TIME_PROFILES_MATCH_WD”
Name: “TimeProfilesMatchWD”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “Characterizes the proximity of time profiles of the request and documents on weekdays”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/TimeProfilesMatch”
Authors: “akorsun”
Responsibles: “alsafr”
}
Factor {
Index: 326
CppName: “FI_TIME_PROFILES_MATCH_WE”
Name: “TimeProfilesMatchWE”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “Characterizes proximity of time profiles of query and documents on weekends”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/TimeProfilesMatch”
Authors: “akorsun”
Responsibles: “alsafr”
}
Factor {
Index: 327
CppName: “FI_CYR_LANG”
Name: “CyrLang”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/CyrLang”
AntiSeoUpperBound: 1.0
Tags: [TG_BINARY, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document language is Cyrillic”
Responsibles: “pavelgur”
}
Factor {
Index: 328
CppName: “FI_REGIONAL_U_QUERY”
Name: “GeoRegionalityU”
DependsOn: [{Feature: [“GeoRegionalityU”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_L2]
Description: “Query factors – the output of the ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoRegionality query geolocalization classifier)). U-geo-useless – regional results for the query are meaningless”
Responsibles: “esoloviev”
}
Factor {
Index: 329
CppName: “FI_REGIONAL_R_QUERY”
Name: “GeoRegionalityR”
DependsOn: [{Feature: [“GeoRegionalityR”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_L2]
Description: “R-geo-relevant – regional results could be useful, but nothing more”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 330
CppName: “FI_REGIONAL_V_QUERY”
Name: “GeoRegionalityV”
DependsOn: [{Feature: [“GeoRegionalityV”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_DEPRECATED, TG_L2]
Description: “V – geo-vital: regional results are of fundamental importance”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 331
CppName: “FI_URL_HAS_NO_DIGITS”
Name: “UrlHasNoDigits”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “There are no numbers in the url”
Authors: “melton”
Responsibles: “melton”
}
Factor {
Index: 332
CppName: “FI_ALICE_MUSIC_TRACK_ARTIST_NAMES_ALL_WCM_MAX_MATCH”
Name: “AliceMusicTrackArtistNamesAllWcmMaxMatch”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “AllWcmMaxMatch factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 333
CppName: “FI_ALICE_MUSIC_TRACK_ALBUM_TITLE_COSINE_MATCH_MAX_PREDICTION”
Name: “AliceMusicTrackAlbumTitleCosineMatchMaxPrediction”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “CosineMatchMaxPrediction factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 334
CppName: “FI_SYN_S1”
Name: “SynS1”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Shows how unnatural the text is from the point of view of the Russian language: an estimate of how likely the document text was produced by a synonymizer or generated automatically. ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=1il#h58953-2 more))”
Authors: “grechnik”
Responsibles: “greek”
}
Factor {
Index: 335
CppName: “FI_SYN_FL_REMAP1”
Name: “SynFLremap1”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Shows how unnatural the text is from the point of view of the Russian language: an estimate of how likely the document text was produced by a synonymizer or generated automatically. ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=1il#h58953-2 more))”
Authors: “grechnik”
Responsibles: “greek”
}
Factor {
Index: 336
CppName: “FI_SYN_FL_REMAP2”
Name: “SynFLremap2”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Shows how unnatural the text is from the point of view of the Russian language: an estimate of how likely the document text was produced by a synonymizer or generated automatically. ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=1il#h58953-2 more))”
Authors: “grechnik”
Responsibles: “greek”
}
Factor {
Index: 337
CppName: “FI_OWNER_SESS_NORM_DUR”
Name: “OwnerSessNormDuration”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEPD]
Description: “nd/k normalized time to click”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 338
CppName: “FI_URL_SESS_NORM_DUR_RATE”
Name: “UrlSessNormDurRate”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEPDTURE]
Description: “nd/i”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 339
CppName: “FI_QUERY_DOWNER_SESS_NORM_DUR”
Name: “QueryDOwnerSessNormDuration”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “nd/k”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 340
CppName: “FI_QUERY_DOWNER_WEIGHT_CLICK”
Name: “QueryDOwnerWeightClick”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “w/k”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 341
CppName: “FI_QUERY_DOWNER_ONLY_CLICK_RATE”
Name: “QueryDOwnerOnlyClickRate”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “o/i”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 342
CppName: “FI_QUERY_DOWNER_CLICK_SUMMARY”
Name: “QueryDOwnerClickSummary”
Ticket: “BUKI-955”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “matched formula”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“akhropov”, “angshu”, “cliff”, “popescul”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 343
CppName: “FI_QUERY_DOWNER_SATISFIED4_RATE”
Name: “QueryDOwnerSatisfied4Rate”
Ticket: “BUKI-955”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “r_s4b/(r_k + 10)”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“akhropov”, “angshu”, “cliff”, “popescul”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 344
CppName: “FI_SYNT_QUALITY”
Name: “SynthQuality”
Wiki: “http://wiki.yandex-team.ru/PoiskovajaPlatforma/Lingvistika/SyntaxInQueries/SyntFactors/IsSynt”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Does the request have full parsing”
Authors: “zador”
Responsibles: “zador”
}
Factor {
Index: 345
CppName: “FI_PAGE_DATE”
Name: “PageDate”
Group: “Datetime”
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The date of the document that is written on the page is remapped by the square root”
Responsibles: “alsafr”
}
Factor {
Index: 346
CppName: “FI_VISITS_P_VISITORS”
Name: “VisitsPVisitors”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: “Remapped mascot feature VisitsPVisitors”
Ticket: “SEARCHSPAM-15531”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “sdormidontov”]
ImplementationTime: “2020-09-30”
}
Factor {
Index: 347
CppName: “FI_RINGS_HOST_RANK_BADNESS_2”
Name: “RingsHostRankBadness2”
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_BINARY, TG_DEPRECATED]
Description: “Additional factors about the promotion of the site by link rings”
Authors: [“denplusplus”, “raigorodsky”]
Responsibles: [“raigorodsky”, “alsafr”]
}
Factor {
Index: 348
CppName: “FI_RINGS_HOST_RANK_BADNESS_3”
Name: “RingsHostRankBadness3”
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED]
Description: “Additional factors about the promotion of the site by link rings”
Authors: [“denplusplus”, “raigorodsky”]
Responsibles: [“raigorodsky”, “alsafr”]
}
Factor {
Index: 349
CppName: “FI_RINGS_HOST_RANK_BADNESS_4”
Name: “RingsHostRankBadness4”
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_BINARY, TG_DEPRECATED]
Description: “Additional factors about the promotion of the site by link rings”
Authors: [“denplusplus”, “raigorodsky”]
Responsibles: [“raigorodsky”, “alsafr”]
}
Factor {
Index: 350
CppName: “FI_HAS_TEXT_POS”
Name: “HasTextPos”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HasTextPos”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document has text relevance”
Authors: “denplusplus”
Responsibles: [“alsafr”, “stash93”]
}
Factor {
Index: 351
CppName: “FI_QSEGMENTS_BM25”
Name: “QSegmentsBM25”
Group: “QSegments”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “BM25 where ‘words’ are selected query segments”
Responsibles: “alsafr”
}
Factor {
Index: 352
CppName: “FI_QSEGMENTS_WEIGHT”
Name: “QSegmentsWeight”
Group: “QSegments”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “‘Weight’ of query segments in text”
Responsibles: “alsafr”
}
Factor {
Index: 353
CppName: “FI_SYN_BAD_WORD_PAIRS”
Name: “SynPercentBadWordPairs”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=186j#h58953-3”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Indicator of the unnaturalness of the text from the point of view of the Russian language. The number of bad pairs of words in the text, renormalized to the interval [0,1] according to the formula z/(z+10)”
Responsibles: “alsafr”
}
Factor {
Index: 354
CppName: “FI_SYN_NUM_BAD_WORD_PAIRS”
Name: “SynNumBadWordPairs”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/antispam?v=186j#h58953-3”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Proportion of bad pairs among all those found in the table: z/(x+1), where z is the number of bad pairs in the text, and x is the number ((http://wiki.yandex-team.ru/EvgenijjGrechnikov/TestSynonimizers 2000-relevant)) couples”
Responsibles: “alsafr”
}
Factor {
Index: 355
CppName: “FI_NUM_LATIN_LETTERS”
Name: “NumLatinLetters”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the number of Latin letters in the text (not counting the markup), driven into [0,1] by the formula n/(n+100)”
Authors: “grechnik”
Responsibles: “greek”
}
Factor {
Index: 356
CppName: “FI_RINGS_HOST_RANK_BADNESS_1”
Name: “RingsHostRankBadness1”
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED]
Description: “Additional factors about the promotion of the site by link rings”
Authors: [“denplusplus”, “raigorodsky”]
Responsibles: [“raigorodsky”, “alsafr”]
}
Factor {
Index: 357
CppName: “FI_DOC_TFIDF_SUM_FIXED”
Name: “DocIdfSumFixed”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Previous Factors – Corrected”
Responsibles: “alsafr”
}
Factor {
Index: 358
CppName: “FI_TITLE_IDF_SUM_FIXED”
Name: “TitleIdfSumFixed”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Previous Factors – Corrected”
Responsibles: “alsafr”
}
Factor {
Index: 359
CppName: “FI_HEADING_IDF_SUM_FIXED”
Name: “HeadingIdfSumFixed”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Previous Factors – Corrected”
Responsibles: “alsafr”
}
Factor {
Index: 360
CppName: “FI_NORMAL_TEXT_IDF_SUM_FIXED”
Name: “NormalTextIdfSumFixed”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Previous Factors – Corrected”
Responsibles: “alsafr”
}
Factor {
Index: 361
CppName: “FI_QUERY_URL_CLICKS_COMBO”
Name: “QueryURLClicksCombo”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “factor cleverly combined from FRC and pseudo-CTR”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: [“lidia”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 362
CppName: “FI_QUERY_DOWNER_CLICKS_COMBO”
Name: “QueryDownerClicksCombo”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “factor cleverly combined from FRC and pseudo-CTR”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Clicks#queryurldownerclickspctrfrccomboreg”
Authors: [“lidia”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 363
CppName: “FI_LR_AMORTIZED_BY_AGE”
Name: “LRAmortizedByAge”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Link relevancy with pessimization for a long link age”
Authors: “dremov”
Responsibles: “dremov”
}
Factor {
Index: 364
CppName: “FI_WORDS_IN_TEXT”
Name: “RusWordsInText”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The number of words in the text (Word – what the lemmer highlighted) is displayed in [0,1] by the formula x/(x+A)”
Authors: “grechnik”
Responsibles: “greek”
}
Factor {
Index: 365
CppName: “FI_WORDS_IN_TITLE”
Name: “RusWordsInTitle”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Number of Russian words in title”
Responsibles: “alsafr”
}
Factor {
Index: 366
CppName: “FI_MEAN_WORD_LENGTH”
Name: “MeanWordLength”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Average word length”
Responsibles: “alsafr”
}
Factor {
Index: 367
CppName: “FI_PERCENT_WORDS_IN_LINKS”
Name: “PercentWordsInLinks”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The percentage of words inside link tags (<a>..</a>) out of the number of all words”
Responsibles: “alsafr”
}
Factor {
Index: 368
CppName: “FI_PERCENT_VISIBLE_CONTENT”
Name: “PercentVisibleContent”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The percentage of the number of words outside the tags (outside the brackets <>) of the number of all words”
Responsibles: “alsafr”
}
Factor {
Index: 369
CppName: “FI_PERCENT_FREQ_WORDS”
Name: “PercentFreqWords”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Percentage of the number of words that are the 200 most frequent words of the language, out of the total number of words in the text”
Responsibles: “alsafr”
}
Factor {
Index: 370
CppName: “FI_PERCENT_USED_FREQ_WORDS”
Name: “PercentUsedFreqWords”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The number of the 500 most popular words of the language used in the text, divided by 500”
Responsibles: “alsafr”
}
Factor {
Index: 371
CppName: “FI_TRIGRAMS_PROB”
Name: “TrigramsProb”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Logarithm of the geometric mean of the probabilities of trigrams in the text. (the probability of a trigram is the number of its occurrences in the text divided by the number of all trigrams) , displayed in [0,1] using the formula -x(x+A)”
Responsibles: “alsafr”
}
Factor {
Index: 372
CppName: “FI_TRIGRAMS_COND_PROB”
Name: “TrigramsCondProb”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Logarithm of the geometric mean of the conditional probabilities of trigrams. The conditional probability of a trigram is its probability divided by the probability of a bigram from the first two words”
Responsibles: “alsafr”
}
Factor {
Index: 373
CppName: “FI_DOPP_DOWNER_PCTR”
Name: “DoppDOwnerPCTR”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “An analogue of the QueryDOwnerClicksPCTR factor, differs from it in that queries are normalized by doppelgangers (details of such normalization can be found at ((http://staff.yandex-team.ru/finder by Andrey Plakhov)), code -ysite/yandex/doppelgangers )”
Authors: “finder”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 374
CppName: “FI_DOPP_DOWNER_PCTR_REG”
Name: “DoppDOwnerPCTR_Reg”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “An analogue of the QueryDOwnerClicksPCTR factor, differs from it in that queries are normalized by doppelgangers (details of such normalization can be found at ((http://staff.yandex-team.ru/finder by Andrey Plakhov)), code – ysite/yandex/doppelgangers). Localized to relev_regions.web.txt”
Authors: “finder”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 375
CppName: “FI_DOPP_URL_PCTR”
Name: “DoppUrlPCTR”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “An analogue of the QueryUrlClicksPCTR factor, differs from it in that requests are normalized by doppelgangers (details of such normalization can be found at ((http://staff.yandex-team.ru/finder by Andrey Plakhov)), code – ysite/yandex/doppelgangers )”
Authors: “finder”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 376
CppName: “FI_DOPP_URL_PCTR_REG”
Name: “DoppUrlPCTR_Reg”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOPP, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “An analogue of the QueryUrlClicksPCTR factor, differs from it in that requests are normalized by doppelgangers (details of such normalization can be found at ((http://staff.yandex-team.ru/finder by Andrey Plakhov)), code – ysite/yandex/doppelgangers). Localized to relev_regions.web.txt”
Authors: “finder”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 377
CppName: “FI_URL_BM25”
Name: “UrlBM25”
AntiSeoUpperBound: 1.0
Wiki: “http://wiki.yandex-team.ru/YandexLabsDev/MLRFeatureResearch/URLMatch”
Group: “UrlBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “BM25 by URL”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 378
CppName: “FI_HAS_BIG_PICTURE”
Name: “HasBigPicture”
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “There is a big picture on the page”
Responsibles: “alsafr”
}
Factor {
Index: 379
CppName: “FI_MATRIXNET”
Name: “MatrixNet”
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_NOT_01, TG_REARR_USE, TG_UNUSED, TG_L3_MODEL_VALUE]
Description: “All factors apply MatrixNet formula (TG_UNUSED – to prevent them from appearing in any formulas)”
Responsibles: “alsafr”
MinValue: -3e+38
MaxValue: 3e+38
}
Factor {
Index: 380
CppName: “FI_DATER_AGE”
Name: “DaterAge”
Group: “Datetime”
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The difference between the current date and the date of the document determined by the dater, 1 – the date of the document is equal to the current one, 0 – the document is 10 years old or more, If the date is not defined, it is 0. Attention! ((1 – DaterAge) * 60) ^2 = page age in days.”
Authors: “velavokr”
Responsibles: “velavokr”
}
Factor {
Index: 381
CppName: “FI_HARD_PESSIMIZATION”
Name: “IsHardPessimization”
Tags: [TG_DOC, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “hard pessimization (aka PR=0), binary factor, counted in antispam”
Authors: “zudina”
Responsibles: “zudina”
}
Factor {
Index: 382
CppName: “FI_C_IN_DEGREE_1”
Name: “CInDegree1”
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: “Host factors that detect sites artificially inflated with links – the second and third incoming degrees”
Authors: “vakoshelev”
Responsibles: “vakoshelev”
}
Factor {
Index: 383
CppName: “FI_C_IN_DEGREE_2”
Name: “CInDegree2”
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: “Host factors that detect sites artificially inflated with links – the second and third incoming degrees”
Authors: “vakoshelev”
Responsibles: “vakoshelev”
}
Factor {
Index: 384
CppName: “FI_NUM_NON_RUSSIAN_LINKS”
Name: “NumNonRussianLinks”
Tags: [TG_DOC, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Number of incoming links without Russian letters. Remapping.”
Responsibles: “alsafr”
}
Factor {
Index: 385
CppName: “FI_TEXT_MAX_FORMS”
Name: “TextMaxForms”
Group: “Text Forms”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Maximum number of forms over all query words – max over all query words number_of_forms_for_word/64”
Responsibles: “alsafr”
}
Factor {
Index: 386
CppName: “FI_TEXT_WEIGHTED_FORMS”
Name: “TextWeightedForms”
Group: “Text Forms”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Word-weighted sum of the number of forms – sum over all query words of number_of_forms_for_word/64*word_weight; remap of the form x/(1 + x).”
Responsibles: “alsafr”
}
Factor {
Index: 387
CppName: “FI_TEXT_FORMS”
Name: “TextForms”
Group: “Text Forms”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Unweighted sum of number of forms – sum over all query words of number_of_forms_for_word/64/number_of_query_words”
Responsibles: “alsafr”
}
Factor {
Index: 388
CppName: “FI_LINK_MAX_FORMS”
Name: “LinkMaxForms”
Group: “Link Forms”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “Maximum number of forms across all query words”
Responsibles: “alsafr”
}
Factor {
Index: 389
CppName: “FI_LINK_WEIGHTED_FORMS”
Name: “LinkWeightedForms”
Group: “Link Forms”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “Word-weighted sum of the number of forms”
Responsibles: “alsafr”
}
Factor {
Index: 390
CppName: “FI_LINK_FORMS”
Name: “LinkForms”
Group: “Link Forms”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “Unweighted sum of the number of forms”
Responsibles: “alsafr”
}
Factor {
Index: 391
CppName: “FI_TEXT_RELEV_WEIGHTED_1”
Name: “TR_W1”
Group: “LegacyTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Analogues of the factors of the same name, word weight = 1”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 392
CppName: “FI_LINK_RELEV_WEIGHTED_1”
Name: “XLR_W1”
Group: [“Xref”, “Dynamic”]
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Analogues of the factors of the same name, word weight = 1”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 393
CppName: “FI_TEXT_BM25_FM_WEIGHTED_1”
Name: “TextBM25_Fm_W1”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Analogues of the factors of the same name, word weight = 1”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 394
CppName: “FI_TEXT_BM25_SYN_WEIGHTED_1”
Name: “TextBM25_Sy_W1”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Analogues of the factors of the same name, word weight = 1”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 395
CppName: “FI_LINK_BM25_WEIGHTED_1”
Name: “LinkBM25_W1”
Group: “LinkBM25”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Analogues of the factors of the same name, word weight = 1”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 396
CppName: “FI_TLBM25_WEIGHTED_1”
Name: “TLBM25_W1”
Group: “TextAndLinkBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: “Analogues of the factors of the same name, word weight = 1”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 397
CppName: “FI_QSEGMENTS_BREAKS”
Name: “QSegmentsBreaks”
Group: “QSegments”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_NN_OVER_FEATURES_USE]
Description: “Query segments are parts of the query that are themselves frequent queries. The factor shows how much the segments are broken up in the text: value 0 – all words occur only within the indicated segments, 1 – all occurrences break the segments”
Authors: “solar”
Responsibles: “solar”
}
Factor {
Index: 398
CppName: “FI_ALICE_MUSIC_TRACK_LYRICS_CMMATCH_TOP5_AVG_MATCH”
Name: “AliceMusicTrackLyricsCMMatchTop5AvgMatch”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “CMMatchTop5AvgMatch factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 399
CppName: “FI_NUMERALS_PORTION”
Name: “NumeralsPortion”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Percentage of different parts of speech in the text. proportion of numerals (among all words for which it was possible to recognize the part of speech)”
Authors: “grechnik”
Responsibles: “greek”
}
Factor {
Index: 400
CppName: “FI_PARTICLES_PORTION”
Name: “ParticlesPortion”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “share of particles”
Responsibles: “alsafr”
}
Factor {
Index: 401
CppName: “FI_ADJ_PRONOUNS_PORTION”
Name: “AdjPronounsPortion”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “share of pronominal adjectives”
Responsibles: “alsafr”
}
Factor {
Index: 402
CppName: “FI_ADV_PRONOUNS_PORTION”
Name: “AdvPronounsPortion”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “share of pronominal adverbs”
Responsibles: “alsafr”
}
Factor {
Index: 403
CppName: “FI_VERBS_PORTION”
Name: “VerbsPortion”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “share of verbs”
Responsibles: “alsafr”
}
Factor {
Index: 404
CppName: “FI_FEM_MAS_NOUNS_PORTION”
Name: “FemAndMasNounsPortion”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “the proportion of words that can be both masculine and feminine nouns, but not neuter, among all nouns (examples: ‘hummingbird’ is an example of an indefinite gender that can be defined in two ways, ‘Alexandra’ is a homonymy ).”
Responsibles: “alsafr”
}
Factor {
Index: 405
CppName: “FI_LINK_QUALITY_FIXED”
Name: “LinkQualityFixed”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: “Quality of incoming links (Leschiner classifier) corrected”
Authors: “somov”
Responsibles: “somov”
}
Factor {
Index: 406
CppName: “FI_HAS_LINK_QUALITY_FIXED”
Name: “HasLinkQualityFixed”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: “Whether LinkQuality was counted for this page or not (didn’t count if there are few links) fixed”
Authors: “somov”
Responsibles: “somov”
}
Factor {
Index: 407
CppName: “FI_NEW_LINK_QUALITY_FIXED”
Name: “NewLinkQualityFixed”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: “Inbound link quality classifier 2 fixed”
Authors: “somov”
Responsibles: “somov”
}
Factor {
Index: 408
CppName: “FI_QUERY_ISORG”
Name: “IsOrg”
DependsOn: [{Feature: [“IsOrg”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “In the request, the name of the organization (example: Gazprom, Gazprom) ((http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares Description))”
Authors: “arseny”
Responsibles: “arseny”
}
Factor {
Index: 409
CppName: “FI_ALICE_MUSIC_ARTIST_NAME_CM_MATCH_TOP5_AVG_MATCH_VALUE”
Name: “AliceMusicArtistNameCMMatchTop5AvgMatchValue”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “CMMatchTop5AvgMatchValue factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 410
CppName: “FI_LONGEST_TEXT”
Name: “LongestText”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE]
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/LongText”
Description: “Size of the largest text segment on the page (from factor [18] PureText)”
Authors: “denplusplus”
Responsibles: [“tsimkha”, “alsafr”]
}
Factor {
Index: 411
CppName: “FI_SMART_UKR”
Name: “SmartUkrainian”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 412
CppName: “FI_SMART_BY”
Name: “SmartBelorussian”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 413
CppName: “FI_LR_WITHOUT_RARE”
Name: “LRWithoutRare”
Group: “LegacyLR”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “link relevance excluding rare words”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 414
CppName: “FI_DIFFERENT_INTERNAL_LINKS”
Name: “DifferentInternalLinks”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Number of different internal links per page”
Authors: “somov”
Responsibles: “somov”
}
Factor {
Index: 415
CppName: “FI_HAS_DETERMINED_CITIES”
Name: “HasDeterminedCities”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: “A city is defined for the site”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 416
CppName: “FI_REGIONAL_U_QUERY_NEW”
Name: “GeoRegionalityUNew”
DependsOn: [{Feature: [“GeoRegionalityUNew”], Slice: “begemot_query_factors”}]
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Group: “Query”
Description: “Request factors – the result of the work ((http://wiki.yandex-team.ru/PoiskovajaPlatforma/Lingvistika/ZaprosnyjeFactory/LocalizovannyjeZaprosy of the request geolocalization classifier)) – a new version of factors [328]-[330]: U – geo-useless – regional results for the query are meaningless;”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 417
CppName: “FI_REGIONAL_R_QUERY_NEW”
Name: “GeoRegionalityRNew”
DependsOn: [{Feature: [“GeoRegionalityRNew”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Request factors – the result of the work ((http://wiki.yandex-team.ru/PoiskovajaPlatforma/Lingvistika/ZaprosnyjeFactory/LocalizovannyjeZaprosy of the request geolocalization classifier)) – new version of factors [328]-[330]: R – georelevant – regional results in the SERP could be useful, but nothing more;”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 418
CppName: “FI_REGIONAL_V_QUERY_NEW”
Name: “GeoRegionalityVNew”
DependsOn: [{Feature: [“GeoRegionalityVNew”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_THEME_CLASSIF, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Request factors – the result of the work ((http://wiki.yandex-team.ru/PoiskovajaPlatforma/Lingvistika/ZaprosnyjeFactory/LocalizovannyjeZaprosy of the request geolocalization classifier)) – a new version of factors [328]-[330]: V – geovital – regional issuance is of fundamental importance.”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 419
CppName: “FI_ALICE_MUSIC_ARTIST_NAME_PER_WORD_CM_MAX_PREDICTION_MIN”
Name: “AliceMusicArtistNamePerWordCMMaxPredictionMin”
Tags: [TG_UNUSED, TG_DYNAMIC, TG_DOC, TG_ALICE_MUSIC, TG_ANNOTATION_NOFILTER, TG_TEXT_MACHINE, TG_ALLOW_USE_FOR_ALICE]
Description: “PerWordCMMaxPredictionMin factor value for AliceMusic stream”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/lingboost”
Ticket: [“BUKI-2932”]
Authors: “anrodigina”
Responsibles: [“anrodigina”, “gotmanov”, “hommforever”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 420
CppName: “FI_PAGE_RANK_UKR”
Name: “UkrainePageRank”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: “Ukrainian Page rank”
Responsibles: “alsafr”
}
Factor {
Index: 421
CppName: “FI_QCLASS_DOWNLOAD”
Name: “QClassDownload”
DependsOn: [{Feature: [“QClassDownload”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “=1 – incl. Download formula. Class requests: download/watch online/play/photo/listen”
Authors: “asannikova”
Responsibles: “alsafr”
}
Factor {
Index: 422
CppName: “FI_QCLASS_BRANDNAMES”
Name: “QClassBrandnames”
DependsOn: [{Feature: [“QClassBrandnames”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “The result of the query classifier: the query contains words from the corresponding dictionary (brands)”
Authors: “agorodilov”
Responsibles: “agorodilov”
}
Factor {
Index: 423
CppName: “FI_QCLASS_DISEASE”
Name: “QClassDisease”
DependsOn: [{Feature: [“QClassDisease”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “medical dictionary”
Authors: “agorodilov”
Responsibles: “agorodilov”
}
Factor {
Index: 424
CppName: “FI_QCLASS_KAK”
Name: “QClassKak”
DependsOn: [{Feature: [“QClassKak”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “question”
Authors: “agorodilov”
Responsibles: “agorodilov”
}
Factor {
Index: 425
CppName: “FI_QCLASS_MOSCOW”
Name: “QClassMoscow”
DependsOn: [{Feature: [“QClassMoscow”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “query specific to Moscow”
Authors: “agorodilov”
Responsibles: “agorodilov”
}
Factor {
Index: 426
CppName: “FI_QCLASS_OAO”
Name: “QClassOAO”
DependsOn: [{Feature: [“QClassOAO”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “organization”
Authors: “agorodilov”
Responsibles: “agorodilov”
}
Factor {
Index: 427
CppName: “FI_QCLASS_PORNO”
Name: “QClassPorno”
DependsOn: [{Feature: [“QClassPorno”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “porn”
Authors: “agorodilov”
Responsibles: “agorodilov”
}
Factor {
Index: 428
CppName: “FI_QCLASS_TRAVEL”
Name: “QClassTravel”
DependsOn: [{Feature: [“QClassTravel”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “travel”
Authors: “agorodilov”
Responsibles: “agorodilov”
}
Factor {
Index: 429
CppName: “FI_VIDEO_RATING”
Name: “VideoRating”
Ticket: “VIDEOPOISK-342”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/VideoRating”
Tags: [TG_DOC, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “The popularity of the video comes from the video”
Comment: “Outdated. Must be eliminated”
Authors: “bort”
Responsibles: “bort”
}
Factor {
Index: 430
CppName: “FI_PERIODIC_LINK_DATES_PERCENT”
Name: “PeriodicLinkDatesPercent”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “The frequency of links to the site”
Authors: “dremov”
Responsibles: “dremov”
}
Factor {
Index: 431
CppName: “FI_LINK_ALMOST_PERIOD”
Name: “LinkAlmostPeriod”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “number of near-periodic links”
Authors: “dremov”
Responsibles: “dremov”
}
Factor {
Index: 432
CppName: “FI_QDOWNER_STAT_POWER”
Name: “QDOwnerStatPower”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “Number of owner impressions per request, normalized x/(100 + x).”
Authors: “solar”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 433
CppName: “FI_QURL_STAT_POWER”
Name: “QUrlStatPower”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_OFTEN_ZERO, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “Number of url impressions per request, normalization x/(100 + x).”
Authors: “solar”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 434
CppName: “FI_HAS_LIRU_CNT”
Name: “HasLiRuCounter”
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “LiveInternet counter available”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 435
CppName: “FI_OWNER_REQS_POPULARITY”
Name: “OwnerReqsPopularity”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/OwnerReqsPopularity”
Description: “Popularity of the owner in requests”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 436
CppName: “FI_DSSM_YA_MUSIC_ASR_EARLY_BINDING_CE”
Name: “DssmYaMusicASREarlyBindingCe”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_DOC_CONTENT, TG_NEURAL, TG_UNUSED, TG_ALICE_MUSIC, TG_RTMODELS_SERVICE, TG_ALLOW_USE_FOR_ALICE]
Description: “Early binding DSSM model trained on reformulations and further trained on the ASR hypothesis of musical requests to Alice”
Ticket: “BUKI-2960”
Authors: [“islobodskov”, “anrodigina”]
Responsibles: [“islobodskov”, “anrodigina”]
}
Factor {
Index: 437
CppName: “FI_DSSM_BERT_DISTILL_SINSIG_CE_COUNTRY_REG_CHAIN”
Name: “DssmBertDistillSinsigCeCountryRegChain”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_NEURAL, TG_USE_MARKUP, TG_ALL_RELEVANCE_MARKUP, TG_SIN_SIG_MARKUP, TG_BERT_DISTILL, TG_UNIMPLEMENTED, TG_DEPRECATED]
Description: “Model trained on a pool of PRS log on Bert prediction, trained on sinsig_ce with a threshold of 0.5, using a chain of regions to a country”
UseArtifact: {Name: “DssmBertDistillSinsigCeCountryRegChain”}
Ticket: “FACTOR-2287”
Authors: [“ivaninap”, “rmplstiltskin”]
Responsibles: [“ivaninap”, “rmplstiltskin”]
}
Factor {
Index: 438
CppName: “FI_DSSM_YA_MUSIC_EARLY_BINDING_CE”
Name: “DssmYaMusicEarlyBindingCe”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_DOC_CONTENT, TG_NEURAL, TG_UNDOCUMENTED, TG_UNUSED, TG_ALICE_MUSIC, TG_RTMODELS_SERVICE, TG_ALLOW_USE_FOR_ALICE]
Description: “An early-binding DSSM model trained on reformulations and retrained on musical requests to Alice”
Ticket: “BUKI-2950”
Authors: “islobodskov”
Responsibles: “islobodskov”
ImplementationTime: “2020-03-17”
}
Factor {
Index: 439
CppName: “FI_SECOND_INDEG_DISTR_XI”
Name: “SecondIndegDistrXi”
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: “Eleven factors based on the statistical properties of the distributions of incoming vertex degrees referring to a fixed vertex of the hostgraph.”
Authors: “filimonov”
Responsibles: “alsafr”
}
Factor {
Index: 440
CppName: “FI_PIRACY_DETECTOR_PREDICT”
Name: “PiracyDetectorPredict”
Ticket: “COMMERCIAL-4”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: “The value of the piracy detector calculated in Begemot.”
MinValue: -10
MaxValue: 10
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
ImplementationTime: “2020-08-17”
}
Factor {
Index: 441
CppName: “FI_ALICE_MUSIC_URL_TYPE_IS_ALBUM”
Name: “AliceMusicUrlTypeIsAlbum”
Tags: [TG_DOC, TG_ALICE_MUSIC, TG_URL_TEXT, TG_BINARY, TG_NN_OVER_FEATURES_USE]
Description: “Yandex music canonized url type – album”
Ticket: “BUKI-2932”
Authors: [“anrodigina”, “gotmanov”]
Responsibles: [“anrodigina”, “gotmanov”]
ImplementationTime: “2020-03-11”
}
Factor {
Index: 442
CppName: “FI_FIRST_VALID_TS_10DAYS”
Name: “FirstValidTs10Days”
Group: “Datetime”
Ticket: “WEBFRESH-695”
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_FRESHNESS_USE, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Counted as (10-x) where x is the document’s return in days (continuously) relative to the document’s validity time in the samovar”
Authors: “alejes”
Responsibles: “alejes”
ImplementationTime: “2020-09-27”
}
Factor {
Index: 443
CppName: “FI_HOST_IN_QUERY”
Name: “HostInQuery”
Tags: [TG_DYNAMIC, TG_HOST, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “Document host recognized in request”
Ticket: “WEBFRESH-623”
Authors: “alejes”
Responsibles: “alejes”
ImplementationTime: “2020-04-18”
}
Factor {
Index: 444
CppName: “FI_VITAL_HOST_IN_QUERY”
Name: “VitalHostInQuery”
Tags: [TG_DYNAMIC, TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “The URL only consists of a host that is recognized in the request”
Ticket: “WEBFRESH-623”
Authors: “alejes”
Responsibles: “alejes”
ImplementationTime: “2020-04-18”
}
Factor {
Index: 445
CppName: “FI_YANDEX_NEWS_STORY_URL”
Name: “YandexNewsStoryUrl”
Tags: [TG_DYNAMIC, TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “URL is a Yandex news story”
Ticket: “WEBFRESH-685”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
ImplementationTime: “2020-08-28”
}
Factor {
Index: 446
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D1T240”
Name: “RcSpylogUrlRationalSigmoidD1T240”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “URL feature computed from rapid clicks spy_log counters with decay of 1 day”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 447
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D1T240_FROZEN”
Name: “RcSpylogUrlRationalSigmoidD1T240Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: “URL feature computed from rapid clicks spy_log counters with decay of 1 day”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-09-01”
}
Factor {
Index: 448
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D0_5T30”
Name: “RcSpylogUrlRationalSigmoidD0_5T30”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “URL feature computed from rapid clicks spy_log counters with decay of 0.5 days”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 449
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D0_5T30_FROZEN”
Name: “RcSpylogUrlRationalSigmoidD0_5T30Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: “URL feature computed from rapid clicks spy_log counters with decay of 0.5 day”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-09-01”
}
Factor {
Index: 450
CppName: “FI_TIMESTAMP”
Name: “Timestamp”
Group: “Datetime”
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_REARR_USE, TG_FRESHNESS_USE, TG_UNUSED]
Description: “Counted as (80 – x) / 80, where x is the age of the document in hours. The factors only make sense for the speedbot base (last 80 hours). Not used in ranking. Used in reranking.”
Authors: “melton”
Responsibles: [“melton”, “alsafr”]
}
Factor {
Index: 451
CppName: “FI_ADD_TIME_FULL”
Name: “AddTimeFull”
Group: “Datetime”
Tags: [TG_DATE, TG_DOC, TG_STATIC, TG_REARR_USE, TG_FRESHNESS_USE, TG_UNUSED]
Description: “Counted as (80 – x) / 80, where x is the age of the document in hours. The factors only make sense for the speedbot base (last 80 hours). Not used in ranking. Used in reranking.”
Authors: “melton”
Responsibles: [“melton”, “alsafr”]
}
Factor {
Index: 452
CppName: “FI_SWBM25”
Name: “Swbm25”
Wiki: “http://wiki.yandex-team.ru/SWBM25”
Group: “SWBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Description: “Cunning BM25 in a sliding window. The size of the window is set in sentences. Wildcards are used for headings and the beginning of the document. Morphological proximity and text structure are taken into account. The weight of the window fades away from the beginning of the document.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 453
CppName: “FI_PLM”
Name: “PositionLanguageModel”
Ticket: “COMBPROLAB-51”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/PositionLanguageModel”
Group: “PositionLanguageModel”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_DEPRECATED]
Description: “A factor about how good a snippet can be.”
Responsibles: “alsafr”
}
Factor {
Index: 454
CppName: “FI_TEXT_PAIR_W1”
Name: “TxtPair_W1”
Group: “TextBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Simple BM25 by word pairs – we take all pairs of words in the query and count the number of their occurrences in the document text. Weight = 1. Comment: does not work if the query contains a stop word”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 455
CppName: “FI_AURA_DOC_LOG_SHARED”
Name: “AuraDocLogShared”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_DEPRECATED]
Description: “Logarithm of the number of shingles where this document is not unique”
Authors: “antonovvk”
Responsibles: [“antonovk”, “smax”]
}
Factor {
Index: 456
CppName: “FI_AURA_DOC_LOG_AUTHOR”
Name: “AuraDocLogAuthor”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_DEPRECATED]
Description: “Logarithm of the number of shingles on which a given document owner is recognized as the author”
Authors: “antonovvk”
Responsibles: [“antonovk”, “smax”]
}
Factor {
Index: 457
CppName: “FI_AURA_DOC_MEAN_SHARED_WEIGHT”
Name: “AuraDocMeanSharedWeight”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_DEPRECATED]
Description: “Average weight of non-unique shingles in this document”
Authors: “antonovvk”
Responsibles: [“antonovk”, “smax”]
}
Factor {
Index: 458
CppName: “FI_MARKET_QUALITY_RATING”
Name: “MarketQualityRating”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_NN_OVER_FEATURES_USE]
Description: “Mascot feature MarketQualityRating”
Ticket: “SEARCHSPAM-15531”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “sdormidontov”]
ImplementationTime: “2020-09-30”
}
Factor {
Index: 459
CppName: “FI_MEDICAL2_HOST_QUALITY”
Name: “Medical2HostQuality”
Ticket: “SENS-87”
Authors: [“anrodigina”]
Responsibles: [“anrodigina”, “hommforever”]
Description: “Medical host quality for new marks.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: “2021-01-12”
}
Factor {
Index: 460
CppName: “FI_MEDICAL2_HOST_QUALITY_FRESH”
Name: “Medical2HostQualityFresh”
Ticket: “SENS-87”
Authors: [“anrodigina”]
Responsibles: [“anrodigina”, “hommforever”]
Description: “Medical host quality for new marks for experiments.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: “2021-01-12”
}
Factor {
Index: 461
CppName: “FI_FIN_LAW_HOST_QUALITY”
Name: “FinLawHostQuality”
Ticket: “SENS-85”
Authors: [“anrodigina”]
Responsibles: [“anrodigina”, “hommforever”]
Description: “Finance or law host quality for new marks.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_NOT_01, TG_USED_IN_CONF_REARR]
MinValue: -1
MaxValue: 1
ImplementationTime: “2021-01-12”
}
Factor {
Index: 462
CppName: “FI_FIN_LAW_HOST_QUALITY_FRESH”
Name: “FinLawHostQualityFresh”
Ticket: “SENS-85”
Authors: [“anrodigina”]
Responsibles: [“anrodigina”, “hommforever”]
Description: “Finance or law host quality for new marks for experiments.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: “2021-01-12”
}
Factor {
Index: 463
CppName: “FI_SOS_HOST_QUALITY”
Name: “SosHostQuality”
Ticket: “SENS-84”
Authors: [“anrodigina”]
Responsibles: [“anrodigina”, “hommforever”]
Description: “Finance or law host quality for new marks.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: “2021-01-12”
}
Factor {
Index: 464
CppName: “FI_SOS_HOST_QUALITY_FRESH”
Name: “SosHostQualityFresh”
Ticket: “SENS-84”
Authors: [“anrodigina”]
Responsibles: [“anrodigina”, “hommforever”]
Description: “Finance or law host quality for new marks for experiments.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED, TG_NOT_01]
MinValue: -1
MaxValue: 1
ImplementationTime: “2021-01-12”
}
Factor {
Index: 465
CppName: “FI_CS_DOCUMENTATION_HOST”
Name: “CsDocumentationHost”
Ticket: “SEARCHPLAY-101”
Authors: “alejes”
Responsibles: “alejes”
Description: “Factor for host in list of documentation cs hosts for experiments”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 466
CppName: “FI_REMOVED_466”
Name: “Removed_466”
Tags: [TG_REMOVED]
}
Factor {
Index: 467
CppName: “FI_REG_HOST_RANK”
Name: “RegHostRank”
Group: “RegHostStatic”
Tags: [TG_LOCALIZED_COUNTRY, TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “It is calculated in the same way as the HostRank factor, but not on the entire owner-graph, but on its subgraph, consisting of the owners of the given region. Belonging to the region is determined by the TLD, or by the presence in the index of pages from the given owner that the geo or geoa classifier assigns to this region. It is mapped in the same way as the HostRank factor, into a number from 0 to 1 with 256 gradations”
Authors: “yoda”
Responsibles: “alsafr”
}
Factor {
Index: 468
CppName: “FI_REG_IS_WIKI”
Name: “RegIsWiki”
Group: “RegHostStatic”
Tags: [TG_LOCALIZED_COUNTRY, TG_HOST, TG_STATIC, TG_WIKIPEDIA, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: “Document from the language section of wikipedia corresponding to the user’s region”
Authors: “yoda”
Responsibles: “alsafr”
}
Factor {
Index: 469
CppName: “FI_LANGUAGE_COMPLIANCE”
Name: “LanguageCompliance”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Document language matches query language”
Authors: “ekrokhalev”
Responsibles: “lamo”
}
Factor {
Index: 470
CppName: “FI_COUNTRY_POPULAR_Q”
Name: “CountryPopularQ”
DependsOn: [{Feature: [“CountryPopularQ”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: “Query popularity within the country”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/PopularQ”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 471
CppName: “FI_COUNTRY_Q_DIVERSITY”
Name: “CountryQDiversity”
DependsOn: [{Feature: [“CountryQDiversity”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: “The degree of centralization of the points from which the request is made (within the country)”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QDiversity”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 472
CppName: “FI_COUNTRY_Q_DIVERSITY2”
Name: “CountryQDiversity2”
DependsOn: [{Feature: [“CountryQDiversity2”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: “Geographic distribution of the request within the country”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Diversity2”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 473
CppName: “FI_COUNTRY_HOUR”
Name: “CountryHour”
DependsOn: [{Feature: [“CountryHour”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: “The most frequent hour for this request”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 474
CppName: “FI_COUNTRY_HOUR_DIVERSITY”
Name: “CountryHourDiversity”
DependsOn: [{Feature: [“CountryHourDiversity”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Countries: CNT_ALL
Description: “Degree of expressiveness of setting requests at different times of the day (within the country)”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/HourDiversity”
Authors: “denplusplus”
Responsibles: [“diver”, “akhropov”]
}
Factor {
Index: 475
CppName: “FI_REMOVED_475”
Name: “Removed_475”
Tags: [TG_REMOVED]
}
Factor {
Index: 476
CppName: “FI_NATIONAL_DOMAIN”
Name: “NationalDomain”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_BINARY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document country (domain) and user country match ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#nationaldomain more))”
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 477
CppName: “FI_IS_PORNO_ADVERT”
Name: “IsPornoAdvert”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_BINARY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Porn ads on the page”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/IsPornoAdvert”
Authors: “shagarov”
Responsibles: “shagarov”
}
Factor {
Index: 478
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D3T120”
Name: “RcSpylogUrlRationalSigmoidD3T120”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “URL feature computed from rapid clicks spy_log counters with decay of 3 days”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 479
CppName: “FI_COUNTRY_QUERY_REGIONALITY”
Name: “CountryQueryRegionality”
DependsOn: [{Feature: [“CountryQueryRegionality”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Country localizability classifier – how far the query implies country context”
Authors: “shutovich”
Responsibles: “shutovich”
}
Factor {
Index: 480
CppName: “FI_NUM_SLASHES”
Name: “NumSlashes”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Number of slashes in url”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 481
CppName: “FI_BM25F_DPR_OBSOLETE”
Name: “BM25FdPR_obsolete”
Group: “BM25F”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNUSED, TG_L2]
Description: “BM25 with different parameters for different fields, including incoming anchor text. Text weights of incoming links to the page are normalized depending on the delta page rank of the link”
Authors: [“grechnik”, “kustarev”]
Responsibles: “grechnik”
}
Factor {
Index: 482
CppName: “FI_WATCH_VIDEO”
Name: “WatchVideo”
Tags: [TG_DOC, TG_STATIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The presence of an embedded video player on the page”
Responsibles: “osenzen”
}
Factor {
Index: 483
CppName: “FI_DOWNLOAD_VIDEO”
Name: “DownloadVideo”
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Video for download”
Responsibles: “alsafr”
}
Factor {
Index: 484
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D3T120_FROZEN”
Name: “RcSpylogUrlRationalSigmoidD3T120Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: “URL feature computed from rapid clicks spy_log counters with decay of 3 days”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-09-01”
}
Factor {
Index: 485
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D14T300”
Name: “RcSpylogUrlRationalSigmoidD14T300”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “URL feature computed from rapid clicks spy_log counters with decay of 14 days”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 486
CppName: “FI_SUBRELEV”
Name: “SubRelevance”
Tags: [TG_DOC, TG_TRANS, TG_REARR_USE, TG_UNUSED, TG_OFTEN_ZERO]
Description: “A service factor that was needed for site search, and will be needed in the future.”
Authors: “karpik”
Responsibles: “apos”
}
Factor {
Index: 487
CppName: “FI_GSK_URL_MODEL”
Name: “GskUrlModel”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/gsk”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The factor is calculated from the url text using the quality/seq/gsk sequence classifier”
Authors: “gulin”
Responsibles: “gulin”
}
Factor {
Index: 488
CppName: “FI_URL_TRIGRAMS”
Name: “UrlTrigrams”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlTrigrams”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Model with training of each trigram on ‘+’ and ‘-‘ urls. Doesn’t depend on query.”
Authors: [“botay”, “denplusplus”]
Responsibles: “alsafr”
}
Factor {
Index: 489
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D14T300_FROZEN”
Name: “RcSpylogUrlRationalSigmoidD14T300Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: “URL feature computed from rapid clicks spy_log counters with decay of 14 days”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-09-01”
}
Factor {
Index: 490
CppName: “FI_RC_SPYLOG_AGE”
Name: “RcSpylogAge”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_NOT_01, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Age of rapid clicks spy_log update, in seconds”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
MinValue: 0
MaxValue: 2592000
}
Factor {
Index: 491
CppName: “FI_RC_SPYLOG_FRESHNESS”
Name: “RcSpylogFreshness”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Freshness of rapid clicks spy_log update”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 492
CppName: “FI_YMW_FULL”
Name: “YmwFull”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_DEPRECATED]
Description: “The size of the minimum piece of text that includes all query words found in the document. Not currently used. ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YMW more))”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 493
CppName: “FI_BCLM”
Name: “Bclm”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Buettcher, Clarke and Lushman name factor (modified) ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BCLm more))”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 494
CppName: “FI_QUERY_COMMERCIALITY_MX”
Name: “QueryCommercialityMx”
DependsOn: [{Feature: [“QueryCommercialityMx”], Slice: “begemot_query_factors”}]
Ticket: “SEARCHSPAM-2317”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QueryCommercialityMx”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COMMERCIAL, TG_TRANS, TG_REARR_USE, TG_L2, TG_DEPRECATED]
Countries: [CNT_RU, CNT_TR]
Description: “A measure of the ‘commerciality’ of a query. It is a complex MatrixNet factor calculated by a formula from the purchase dictionary in direct, user query logs, and additional intent dictionaries. For queries with the intent to buy, the factor tends to 1; for product queries, to 0.6; for queries without the intent to buy (reviews, etc.), to 0. See the Wiki page for details.”
Authors: [“anelyubin”, “kvn”]
Responsibles: [“anelyubin”, “kvn”]
DependsOn: [{Feature: [“QueryNonCommerciality”, “ProductCategoryQuery”, “ProductCategoryVendor”, “IsNavQuery”, “QClassDownload”, “QClassBrandnames”, “QClassDisease”, “QClassKak”, “QClassMoscow”, “QClassOAO”, “QClassPorno” , “QClassTravel”, “CountryPopularQ”]}]
}
Factor {
Index: 495
CppName: “FI_FIELD_LM”
Name: “FieldLM”
Group: “BM25F”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Unigram language model. The language model is modeled according to the document, smoothed by the general language model. When building the model according to the document, information is used about in which field of the document the query word was found (Title, head or plain text)”
Authors: “ylogachev”
Responsibles: “ylogachev”
}
Factor {
Index: 496
CppName: “FI_GEO_CITY_URL_REGION_CITY”
Name: “GeoCityUrlRegionCity”
Ticket: “BUKI-1125”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_URL_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Coincidence of the geography determined from the url of the document and the city of the request (ip or lr)”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 497
CppName: “FI_GEO_CITY_URL_REGION_REGION”
Name: “GeoCityUrlRegionRegion”
Ticket: “BUKI-1125”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Coincidence of the geography determined from the document url and the request area (ip or lr)”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 498
CppName: “FI_GEO_CITY_URL_REGION_COUNTRY”
Name: “GeoCityUrlRegionCountry”
Ticket: “BUKI-1125”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_URL_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Coincidence of the geography determined from the url of the document and the country of the request (ip or lr). Relevant for Russia and Ukraine.”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 499
CppName: “FI_GEO_CITY_URL_GEO_CITY_CITY”
Name: “GeoCityUrlGeoCityCity”
Ticket: “BUKI-1125”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_GEOINQUERY, TG_URL_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Coincidence of the geography determined from the url of the document and the city in the request (GeoCity rule)”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 500
CppName: “FI_PAY_APP_DETECTOR_PREDICT”
Name: “PayAppDetectorPredict”
Ticket: “COMMERCIAL-19”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: “The value of the forked commerce detector calculated in Begemot.”
MinValue: -10
MaxValue: 10
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
ImplementationTime: “2020-08-01”
}
Factor {
Index: 501
CppName: “FI_TITLE_TRIGRAMS_Q”
Name: “TitleTrigramsQuery”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Calculates query coverage by letter trigrams of document header”
Authors: “akorsun”
Responsibles: “alsafr”
}
Factor {
Index: 502
CppName: “FI_TITLE_TRIGRAMS_T”
Name: “TitleTrigramsTitle”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Calculates the heading coverage by letter trigrams of the document heading”
Authors: “akorsun”
Responsibles: “alsafr”
}
Factor {
Index: 503
CppName: “FI_INLINKS_MODEL”
Name: “InlinkModel”
Ticket: “COMBPROLAB-69”
Group: [“Xref”, “Dynamic”]
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_UNUSED]
Description: “A probabilistic model built on the texts of incoming links”
Authors: “grechnik”
Responsibles: “greek”
}
Factor {
Index: 504
CppName: “FI_QUERY_WORD_SEQUENCES_TR”
Name: “QueryWordSequencesTR”
Group: “QueryWordSequencesTR”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Calculates the sum of occurrences of the following form: a sequence of query words longer than two occurring in one sentence; normalized to the length of the document.”
Authors: “akorsun”
Responsibles: “alsafr”
}
Factor {
Index: 505
CppName: “FI_QUERY_WORD_SEQUENCES_LR”
Name: “QueryWordSequencesLR”
Group: “QueryWordSequencesLR”
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Counts the sum of occurrences of the following form: a sequence of query words longer than two, encountered in one link; normalized to the number of links.”
Authors: “akorsun”
Responsibles: “alsafr”
}
Factor {
Index: 506
CppName: “FI_OWNER_NAV_QUOTA”
Name: “OwnerNavQuota”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_REARR_USE, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG2DEPREC_DEP]
Description: “Navigation click-through rate”
Authors: “ulyanov”
Responsibles: [“ulyanov”, “tarum”, “niknik”]
}
Factor {
Index: 507
CppName: “FI_GEO_RELEV_ALIEN_CITY”
Name: “GeoRelevAlienCity”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: “The result has a georeference that does not match the user’s geography at the city level ([415]==1 && [215]==0)”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 508
CppName: “FI_GEO_V_QUERY_IN_USERS_CITY”
Name: “GeoVQueryInUserCity”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Geovitality of the query for results from the user’s region”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 509
CppName: “FI_GEO_V_QUERY_IN_ALIEN_CITY”
Name: “GeoVQueryInAlienCity”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Geovitality of the query for results not from the user’s region”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 510
CppName: “FI_HOST_RELIABILITY”
Name: “HostReliability”
Tags: [TG_HOST, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “percentage of urls that respond without errors”
Responsibles: “alsafr”
}
Factor {
Index: 511
CppName: “FI_DMOZ_THEME_MATCH_ALL”
Name: “DmozThemeMatchAll”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Coincidence of the thematic spectrum (according to DMOZ) of the request and the document. The topic of the request is determined by ((http://wiki.yandex-team.ru/JandeksPoisk/ZarubezhnyjjInternet/DMOZqueryClassifier1 by the DMOZTheme wizard’s rule)) The subject of the document is determined by an automatic classifier”
Authors: [“ekrokhalev”, “pyal”]
Responsibles: [“pyal”, “lamo”]
}
Factor {
Index: 512
CppName: “FI_DMOZ_THEME_MATCH_BEST”
Name: “DmozThemeMatchBest”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Coincidence of the thematic spectrum (according to DMOZ) of the query and the document. The subject of the query is determined by the best result ((http://wiki.yandex-team.ru/JandeksPoisk/ZarubezhnyjjInternet/DMOZqueryClassifier1 DMOZTheme wizard’s rules)) The subject of the document is determined by an automatic classifier”
Authors: [“ekrokhalev”, “pyal”]
Responsibles: [“pyal”, “lamo”]
}
Factor {
Index: 513
CppName: “FI_MPSA”
Name: “MPsa”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Estimates the minimum distance between pairs of query words, taking into account the distance of the pair from the beginning of the document (Minimal Pair Size with Attenuation). Pairs are understood as all consecutive bigrams of query words. Thus, the number of pairs is equal to the number of words in the query, reduced by 1. Accordingly, the factor makes sense for requests consisting of more than one word.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 514
CppName: “FI_BCLM2”
Name: “Bclm2”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Different from BCLm in that the weights of all words are considered the same. ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BCLm2 BCLm2))”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 515
CppName: “FI_ABSOLUTE_PLM”
Name: “AbsolutePLM”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Text relevance based on the language model, taking into account the absolute position. We go through the text with a window of 20 words, build a language model for each window (that is, a probability distribution on the words of the Russian language) and calculate the probability of generating a query. The model is penalized for distance from the beginning of the document.”
Authors: “kustarev”
Responsibles: “alsafr”
}
Factor {
Index: 516
CppName: “FI_PAGE_REGION_COVERAGE”
Name: “PageRegionCoverage”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 517
CppName: “FI_PAGE_REGION_SIZE”
Name: “PageRegionSize”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: “Page region size”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 518
CppName: “FI_PAGE_REGION_REL_COVERAGE”
Name: “PageRegionRelCoverage”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 519
CppName: “FI_RC_SPYLOG_FRESHNESS_AT_REQ”
Name: “RcSpylogFreshnessAtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: “Freshness of rapid clicks spy_log update, calculated at the request time”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-09-01”
}
Factor {
Index: 520
CppName: “FI_QUERY_ISGEO”
Name: “IsGeo”
DependsOn: [{Feature: [“IsGeo”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1316”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsGeo”
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Lowers the maximum weight of the encountered geo object in the request under the name isgeo. A geo object is an object of the category Geo, Geo1, GeoAddr, GeoAddr1, LandMark, LandMark1 (see ((http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects som markup))). ((http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares More))”
Authors: “arseny”
Responsibles: “arseny”
}
Factor {
Index: 521
CppName: “FI_QUERY_ISMUSIC”
Name: “IsMusic”
DependsOn: [{Feature: [“IsMusic”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1316”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsMusic”
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Reduces to basic searches under the name ismusic the maximum weight of the encountered object of the Music or Music1 category in the request. (See ((http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects som markup))). ((http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares More))”
Authors: “arseny”
Responsibles: “arseny”
}
Factor {
Index: 522
CppName: “FI_BCLM_LITE”
Name: “BclmLite”
Group: “BCLM”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NO_L3, TG_NN_OVER_FEATURES_USE]
Description: “Modification of the Bclm2 factor, lighter for use in fastrank. The main difference is that BclmLite does not use absolute word offsets relative to the beginning of the document. Instead, the factor works with normal positions of the form <Sentence_Number, Sentence_Position>. At the same time, proximity between words is taken into account only inside the sentence.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 523
CppName: “FI_QUERY_NEARBY”
Name: “NearbyQuery”
DependsOn: [{Feature: [“NearbyQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “When answering a query, results in the immediate vicinity are important ([pharmacies], [children’s clinics])”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 524
CppName: “FI_QUERY_CITY”
Name: “CityQuery”
DependsOn: [{Feature: [“CityQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_DEPRECATED]
Description: “When answering a query, the results within the city are important (the bulk of localizable queries)”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 525
CppName: “FI_QUERY_ADM”
Name: “AdmQuery”
DependsOn: [{Feature: [“AdmQuery”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_DEPRECATED]
Description: “When answering a query, results from the user’s area, region ([airport], [dairy]) are important”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 526
CppName: “FI_NUM_LINKS_FROM_MP”
Name: “NumLinksFromMP”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Number of incoming links from main pages (site home pages)”
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 527
CppName: “FI_YMW_FULL2”
Name: “YmwFull2”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Corrected YmwFull. It differs from the previous version only in the behavior on 2-word queries. ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YMW more))”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 528
CppName: “FI_FULL_QUORUM”
Name: “FullQuorum”
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_REARR_USE, TG_DEPRECATED]
Description: “Binary factor, each word of the query is in the text or in the links”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 529
CppName: “FI_AUXC_TEXT_BM25”
Name: “AuxCTextBM25”
AntiSeoUpperBound: 0.8
Group: “AuxBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_UNUSED, TG_OFTEN_ZERO]
Description: “uses ‘country aux tree’ (auxqc)”
Authors: “shutovich”
Responsibles: “shutovich”
}
Factor {
Index: 530
CppName: “FI_AUXC_LINK_BM25”
Name: “AuxCLinkBM25”
AntiSeoUpperBound: 0.8
Group: “AuxBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_UNUSED, TG_OFTEN_ZERO]
Description: “uses ‘country aux tree’ (auxqc)”
Authors: “shutovich”
Responsibles: “shutovich”
}
Factor {
Index: 531
CppName: “FI_SOFT_404”
Name: “Soft404”
Ticket: “ARC-1046”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Page – ‘404’ (share of ‘404’ tokens in relation to the total number of tokens on the page)”
Authors: “avatar”
Responsibles: “avatar”
}
Factor {
Index: 532
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D1T240_AT_REQ”
Name: “RcSpylogUrlRationalSigmoidD1T240AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: “URL feature computed at the request time from rapid clicks spy_log counters with decay of 1 day”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-09-01”
}
Factor {
Index: 533
CppName: “FI_DBM25”
Name: “DBM25”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DBM25”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “BM25 machine-matched word weight”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 534
CppName: “FI_QUERY_WORD_COHESION_TR”
Name: “QueryWordCohesionTR”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The factor evaluates how the query words are grouped together in the text of the document, regardless of their order. ((http://wiki.yandex-team.ru/SergejjKrylov/QueryWordCohesionTR description))”
Authors: “kryloff”
Responsibles: “kryloff”
}
Factor {
Index: 535
CppName: “FI_OWNER_SESS_NORM_DUR_REG”
Name: “OwnerSessNormDuration_Reg”
Group: “RegHostStatic”
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_2RECEPATE_D]
Countries: CNT_RELEV
Description: “nd/k normalized time to click”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 536
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D0_5T30_AT_REQ”
Name: “RcSpylogUrlRationalSigmoidD0_5T30AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: “URL feature computed at the request time from rapid clicks spy_log counters with decay of 0.5 days”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-09-01”
}
Factor {
Index: 537
CppName: “FI_QUERY_DOWNER_SESS_NORM_DUR_REG”
Name: “QueryDOwnerSessNormDuration_Reg”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “nd/k”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 538
CppName: “FI_QUERY_DOWNER_WEIGHT_CLICK_REG”
Name: “QueryDOwnerWeightClick_Reg”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “w/k”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 539
CppName: “FI_QUERY_DOWNER_ONLY_CLICK_RATE_REG”
Name: “QueryDOwnerOnlyClickRate_Reg”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “o/i”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 540
CppName: “FI_QUERY_DOWNER_CLICK_SUMMARY_REG”
Name: “QueryDOwnerClickSummary_Reg”
Ticket: “BUKI-955”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “matched formula”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“popescul”, “cliff”, “angshu”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 541
CppName: “FI_QUERY_DOWNER_SATISFIED4_RATE_REG”
Name: “QueryDOwnerSatisfied4Rate_Reg”
Ticket: “BUKI-955”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “r_s4b/(r_k + 10)”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“popescul”, “cliff”, “angshu”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 542
CppName: “FI_SEGMENT_AUX_ALPHAS_IN_TEXT”
Name: “SegmentAuxAlphasInText”
Ticket: “BUKI-1109”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SegmentAuxAlphasInText”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Number of letters in the Aux segment”
Authors: “avatar”
Responsibles: “avatar”
}
Factor {
Index: 543
CppName: “FI_SEGMENT_AUX_SPACES_IN_TEXT”
Name: “SegmentAuxSpacesInText”
Ticket: “BUKI-1109”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SegmentAuxSpacesInText”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Number of spaces in the Aux segment”
Authors: “avatar”
Responsibles: “avatar”
}
Factor {
Index: 544
CppName: “FI_SEGMENT_CONTENT_COMMAS_IN_TEXT”
Name: “SegmentContentCommasInText”
Ticket: “BUKI-1109”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SegmentContentCommasInText”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Number of commas in the Content segment”
Authors: “avatar”
Responsibles: “avatar”
}
Factor {
Index: 545
CppName: “FI_CLASSIF_IS_SHOP”
Name: “IsShop”
Ticket: “BUKI-1128”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_DEPRECATED, TG_L2]
Description: “Page is a shop. ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#isshop description)) Not used (deprecated)”
Authors: “smikler”
Responsibles: “smikler”
}
Factor {
Index: 546
CppName: “FI_LR_GEO_RELEV_REGION_NATDOM”
Name: “XLRGeoRelevRegionNatDomain”
Group: “Xref”
Tags: [TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_LINK_GRAPH, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Authors: “agorodilov”
Responsibles: “agorodilov”
}
Factor {
Index: 547
CppName: “FI_AURA_DOC_LOG_ORIGIN”
Name: “AuraDocLogOrigin”
Tags: [TG_DOC_TEXT, TG_OWNER, TG_STATIC, TG_REARR_USE, TG_UNUSED, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “Logarithm of the number of shingles in the document added by the site owner as original texts in ((http://wiki.yandex-team.ru/JandeksPoisk/Jekosistema/MarketingPR/Webmasters/plan/vtorcontect Originality Plugin)). Does not participate in the formula, needed to re-arrange duplicates”
Authors: “antonovvk”
Responsibles: [“antonovk”, “smax”]
}
Factor {
Index: 548
CppName: “FI_AURA_DOC_MEAN_FLT_AUTHOR_SOURCE”
Name: “AuraDocMeanFltAuthorSource”
Tags: [TG_DOC_TEXT, TG_OWNER, TG_STATIC, TG_UNUSED, TG_DEPRECATED]
Description: “Average filtered number of document authorship sources. Not included in the formula, needed to re-rank duplicates”
Authors: “antonovvk”
Responsibles: [“antonovk”, “smax”]
}
Factor {
Index: 549
CppName: “FI_QUERY_REF_TRIGRAM_Q”
Name: “QueryRefTrigramQuery”
Ticket: “BUKI-1117”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#queryreftrigrams description))”
Authors: “vvp”
Responsibles: [“mbusel”, “tsimkha”]
}
Factor {
Index: 550
CppName: “FI_QUERY_REF_TRIGRAM_R”
Name: “QueryRefTrigramReferences”
Ticket: “BUKI-1117”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov#queryreftrigrams description))”
Authors: “vvp”
Responsibles: [“mbusel”, “tsimkha”]
}
Factor {
Index: 551
CppName: “FI_IDF_VARIANCE”
Name: “IdfVariance”
Group: “Dynamic”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “IDF variance of query words given text hits in the document (mixed query-text factor)”
Authors: “grechnik”
Responsibles: “greek”
}
Factor {
Index: 552
CppName: “FI_URL_NGRAMS_MODEL”
Name: “UrlNGramsModel”
Ticket: “BUKI-1145”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/UrlNGramsModel”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Ranking factor UrlNGramsModel in erf”
Authors: “avatar”
Responsibles: “avatar”
}
Factor {
Index: 553
CppName: “FI_NATIONAL_LANGUAGE”
Name: “NationalLanguage”
Tags: [TG_LOCALIZED_COUNTRY, TG_DYNAMIC, TG_DOC_TEXT, TG_BINARY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_NN_OVER_FEATURES_USE]
Description: “The language of the document matches the country of the request”
Authors: “dremov”
Responsibles: “dremov”
}
Factor {
Index: 554
CppName: “FI_OWNER_IS_COMMERCIAL”
Name: “OwnerIsCommercial”
Ticket: “SEARCHSPAM-2603”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostIsCommercial”
Tags: [TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COMMERCIAL, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Authors: [“anelyubin”, “sisoid”]
Responsibles: [“anelyubin”, “sisoid”]
}
Factor {
Index: 555
CppName: “FI_GEO_COUNTRY_URL_REGION_COUNTRY”
Name: “GeoCountryUrlRegionCountry”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_COUNTRY, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 556
CppName: “FI_GEO_COUNTRY_URL_GEO_COUNTRY”
Name: “GeoCountryUrlGeoCountry”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_GEOINQUERY, TG_URL_TEXT, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 557
CppName: “FI_NUM_LINKS_FROM_SEGMENT_CONTENT”
Name: “NumLinksFromSegmentContent”
Ticket: “BUKI-1161”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/NumLinksFromSegmentContent”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 558
CppName: “FI_LOCM”
Name: “Locm”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Locm”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Word order in links.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 559
CppName: “FI_URL_QUERY_VARIETY_REG”
Name: “UrlQueryVariety_Reg”
Ticket: “BUKI-1159”
Group: “RegDocStatic”
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “The degree of diversity of requests that are clicked on this url is calculated by region”
Wiki: “https://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Kliki#urlqueryvarietyreg”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 560
CppName: “FI_URL_SESS_NORM_DUR_RATE_REG”
Name: “UrlSessNormDurRate_Reg”
Ticket: “BUKI-1159”
Group: “RegDocStatic”
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_D]
Countries: CNT_RELEV
Description: “nd/i”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty#polzovatelskiesessii”
Authors: [“cliff”, “akhropov”, “angshu”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 561
CppName: “FI_FILTRATION_SEGMENTS”
Name: “FiltrationSegments”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: “Percentage of query segments present in text”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 562
CppName: “FI_LANGUAGE_GOOD_FOR_TURKEY”
Name: “LanguageGoodForTurkey”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The language of the document is one of the allowed ones for Turkey (Turkish, English, German, French, Arabic, Azeri) or the document has zero length. Only IsRealGeoLocal queries are calculated at the search stage.”
Authors: “dremov”
Responsibles: “dremov”
}
Factor {
Index: 563
CppName: “FI_DBM25_2”
Name: “DBM25_2”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_REARR_USE, TG_NN_OVER_FEATURES_USE]
Description: “Variation on the theme ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DBM25 DBM25)), see ysite/yandex/relevance/dbm25.cpp”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 564
CppName: “FI_GEO_DISPERSION”
Name: “GeoDispersion”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “Dispersion of document link regions”
Authors: “bochkarev”
Responsibles: “bochkarev”
}
Factor {
Index: 565
CppName: “FI_QUERY_DOWNER_ENOUGH_CLICKED”
Name: “QueryDownerEnoughClicked”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QueryDownerEnoughClicked”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “The number of clicks on the owner and the number of clicks on the request is greater than 5”
Authors: [“snailer”, “akhropov”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 566
CppName: “FI_BM25F_DPR_FIXED”
Name: “BM25FdPRFixed”
Group: “BM25F”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: “BM25FdPR normalized to the average document length depending on the language of the document. ((http://wiki.yandex-team.ru/BM25FRework Test results.))”
Authors: “lamo”
Responsibles: “lamo”
}
Factor {
Index: 567
CppName: “FI_LANG_POPULARITY”
Name: “LanguagePopularity”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document language popularity. A number from 0 to 1. ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LanguagePopularity LanguagePopularity))”
Authors: “lamo”
Responsibles: “lamo”
}
Factor {
Index: 568
CppName: “FI_QUERY_DOWNER_WS_FRC_AND_BM25F_DPR_FIXED”
Name: “QueryDOwnerWeightedSumFRCAndBM25FdPRFixed”
Tags: [TG_DEPRECATED, TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_DOC_TEXT, TG_TRANS, TG_USER_SEARCH_EXTERNAL, TG_UNUSED, TG_L2]
Countries: CNT_RELEV
Description: “The sum of the QueryDOwnerClicksFRC and BM25FdPRFixed factors with weights 0.358449 and 0.184922 respectively. The ‘565’ in the factor name should not be taken literally, it’s a legacy or a typo.”
Authors: [“grechnik”, “kustarev”]
Responsibles: “greek”
DependsOn: [{Feature: [“QueryDOwnerClicksFRC”, “BM25FdPRFixed”]}]
}
Factor {
Index: 569
CppName: “FI_QUERY_DOWNER_WS_MAX_WHR_AND_ONLY_CLICK_RATE”
Name: “QueryDOwnerWeightedSumMaxWHRAndOnlyClickRate”
Tags: [TG_DEPRECATED, TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_TRANS, TG_USER_SEARCH_EXTERNAL, TG_UNUSED]
Countries: CNT_RELEV
Description: “The sum of factors 192 and 341 with weights 0.298942 and 0.454625 respectively.”
Authors: [“grechnik”, “kustarev”]
Responsibles: “greek”
DependsOn: [{Feature: [“MaxWordHostRank”, “QueryDOwnerOnlyClickRate”]}]
}
Factor {
Index: 570
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D3T120_AT_REQ”
Name: “RcSpylogUrlRationalSigmoidD3T120AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: “URL feature computed at the request time from rapid clicks spy_log counters with decay of 3 days”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-09-01”
}
Factor {
Index: 571
CppName: “FI_RC_SPYLOG_URL_RATIONAL_SIGMOID_D14T300_AT_REQ”
Name: “RcSpylogUrlRationalSigmoidD14T300AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_SPYLOG_RAPID_CLICKS_BIGRT, TG_NN_OVER_FEATURES_USE]
Description: “URL feature computed at the request time from rapid clicks spy_log counters with decay of 14 days”
Ticket: “USERFEAT-1493”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-09-01”
}
Factor {
Index: 572
CppName: “FI_TOCM”
Name: “Tocm”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Tocm”
Group: “Tocm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The factor evaluates the differences between the positions of words in the title and the positions of words in the query”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 573
CppName: “FI_RELEV_GEO_LINKS_PERCENT”
Name: “RelevGeoLinksPercent”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_LINK_GRAPH, TG_UNDOCUMENTED, TG_UNUSED]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 574
CppName: “FI_LANG_DISPERSION”
Name: “LangDispersion”
Ticket: “BUKI-1228”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LangDispersion”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “Dispersion of languages in xmap”
Authors: “kartynnik”
Responsibles: “kartynnik”
}
Factor {
Index: 575
CppName: “FI_HAS_MISSPELL”
Name: “HasMisspell”
DependsOn: [{Feature: [“HasMisspell”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “There is a typo in the request”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 576
CppName: “FI_DBM30_SMERCH”
Name: “DBM30Smerch”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Variation on the theme ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DBM25 DBM25)), see ysite/yandex/relevance/dbm25.cpp”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 577
CppName: “FI_IS_URL_FOR_CLICK_DEBOOST”
Name: “IsUrlForClickDeboost”
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_OFTEN_ZERO, TG_REARR_USE, TG_DATA_FROM_SAASKV, TG_USED_IN_CONF_REARR]
Authors: “hommforever”
Responsibles: [“hommforever”, “ilnurkh”]
Description: “Url is known to show too often with very low relevance (by burt and/or by bm25)”
ImplementationTime: “2021-01-12”
}
Factor {
Index: 578
CppName: “FI_URL_LINK_PERCENT”
Name: “UrlLinkPercent”
Ticket: “BUKI-1233”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/UrlLinkPercent”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “The ratio of the number of incoming links whose text is a URL to the number of all incoming links”
Authors: “suncpp”
Responsibles: “alsafr”
}
Factor {
Index: 579
CppName: “FI_DSSM_BERT_DISTILL_L2”
Name: “DssmBertDistillL2”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_NEURAL, TG_USE_MARKUP, TG_ALL_RELEVANCE_MARKUP, TG_SIN_SIG_MARKUP, TG_BERT_DISTILL, TG_L2]
Description: “A pool of PRS logs is marked up using Bert trained on sinsig. A dssm model is trained on this pool using BaseRegionChain”
UseArtifact: {Name: “DssmBertDistillL2”}
Ticket: “BERT-179”
Authors: [“film”]
Responsibles: [“movies”]
ImplementationTime: “2020-08-30”
}
Factor {
Index: 580
CppName: “FI_NUM_NON_LETTERS_IN_URL”
Name: “NumNonLettersInUrl”
Ticket: “BUKI-1238”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/NumNonLettersInUrl”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Number of ‘non-letters’ in url”
Authors: “kartynnik”
Responsibles: “kartynnik”
}
Factor {
Index: 581
CppName: “FI_URL_LENGTH_2”
Name: “UrlLen2”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_UNUSED, TG_L2]
Ticket: “BUKI-1252”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/UrlLen2”
Description: “Length of the URL to the nearest character. Disabled in production.”
Authors: “kartynnik”
Responsibles: “kartynnik”
}
Factor {
Index: 582
CppName: “FI_IS_HUB”
Name: “IsHub”
Ticket: “BUKI-1257”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsHub”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Hub page”
Authors: “suncpp”
Responsibles: “alsafr”
}
Factor {
Index: 583
CppName: “FI_STATIC_TITLE_COMM”
Name: “StaticTitleComm”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/StaticTitleComm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “The degree of commerciality of the page title. Not used (deprecated)”
Authors: “zosimov”
Responsibles: “zosimov”
}
Factor {
Index: 584
CppName: “FI_STATIC_TITLE_BM25_EX”
Name: “StaticTitleBM25Ex”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/StaticTitleBM25Ex”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “BM25 page title by page text”
Authors: “zosimov”
Responsibles: “zosimov”
}
Factor {
Index: 585
CppName: “FI_STATIC_TITLE_LR_BM25”
Name: “StaticTitleLRBM25”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/StaticTitleLRBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: “BM25 page title by link text”
Authors: “zosimov”
Responsibles: “zosimov”
}
Factor {
Index: 586
CppName: “FI_SEO_IN_PAY_LINKS”
Name: “SeoInPayLinks”
Ticket: “BUKI-1243”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SeoInPayLinks”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “Number of incoming seo trash links between hosts”
Authors: “suncpp”
Responsibles: “alsafr”
}
Factor {
Index: 587
CppName: “FI_US_LONG_PERIOD_URL_MOBILE_DT180_AVG”
Name: “USLongPeriodUrlMobileDt180Avg”
Ticket: [“FACTOR-1129”]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DW]
Description: “Static URL factor for search sessions over 1600 days calculated from mobile sessions. Average DwellTime, with DwellTime from the session truncated if greater than 180 seconds”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors”
Authors: [“edik”]
Responsibles: [“edik”, “tarum”, “niknik”]
}
Factor {
Index: 588
CppName: “FI_US_LONG_PERIOD_URL_MOBILE_LONG_CLICK_PROB”
Name: “USLongPeriodUrlMobileLongClickProb”
Ticket: [“FACTOR-1129”]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DW]
Description: “Static URL factor for search sessions for 1600 days calculated for mobile sessions. Probability that a URL click will be more than 120 seconds”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors”
Authors: [“edik”]
Responsibles: [“edik”, “tarum”, “niknik”]
}
Factor {
Index: 589
CppName: “FI_US_LONG_PERIOD_URL_MOBILE_LOSSES_PROB”
Name: “USLongPeriodUrlMobileLossesProb”
Ticket: [“FACTOR-1129”]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICK_MACHINE]
Description: “Static URL factor for search sessions over 1600 days calculated from mobile sessions. Probability of a URL not being clicked if at least one URL is clicked below.”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors”
Authors: [“edik”]
Responsibles: [“edik”, “tarum”, “niknik”]
}
Factor {
Index: 590
CppName: “FI_US_LONG_PERIOD_URL_MOBILE_DT3600_AVG_REG”
Name: “USLongPeriodUrlMobileDt3600AvgReg”
Ticket: [“FACTOR-1129”]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_CLICK_MACHINE]
Countries: CNT_RELEV
Description: “Static URL factor for search sessions over 1600 days calculated from mobile sessions. Average DwellTime, with session DwellTime truncated if greater than 3600 seconds. Localized to country level.”
Group: “RegDocStatic”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors”
Authors: [“edik”]
Responsibles: [“edik”, “tarum”, “niknik”]
}
Factor {
Index: 591
CppName: “FI_US_LONG_PERIOD_URL_MOBILE_DT180_AVG_REG”
Name: “USLongPeriodUrlMobileDt180AvgReg”
Ticket: [“FACTOR-1129”]
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1600D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_CLICK_MACHINE]
Countries: CNT_RELEV
Description: “Static URL factor for search sessions over 1600 days calculated from mobile sessions. Average DwellTime, with session DwellTime truncated if greater than 180 seconds. Localized to country level.”
Group: “RegDocStatic”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/USLongPeriodUrlFactors”
Authors: [“edik”]
Responsibles: [“edik”, “tarum”, “niknik”]
}
Factor {
Index: 592
CppName: “FI_HP_DETECTOR_PREDICT”
Name: “HpDetectorPredict”
Ticket: “COMMERCIAL-45”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: “The value of the health detector calculated in Begemot.”
MinValue: -10
MaxValue: 10
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
ImplementationTime: “2020-09-25”
}
Factor {
Index: 593
CppName: “FI_IS_FEED_LISTING”
Name: “IsFeedListing”
Ticket: “SEARCHSPAM-15486”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “ulyanov”]
Description: “OffersBase feature for ecoboost.”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 594
CppName: “FI_IS_FEED_MAIN”
Name: “IsFeedMain”
Ticket: “SEARCHSPAM-15486”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “ulyanov”]
Description: “OffersBase feature for ecoboost.”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 595
CppName: “FI_IS_FEED_STRATOCASTER”
Name: “IsFeedStratocaster”
Ticket: “SEARCHSPAM-15486”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “ulyanov”]
Description: “OffersBase feature for ecoboost.”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 596
CppName: “FI_IS_FEED_ANY”
Name: “IsFeedAny”
Ticket: “SEARCHSPAM-15486”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “ulyanov”]
Description: “OffersBase feature for ecoboost.”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 597
CppName: “FI_TITLE_IN_LINKS_TRIGRAMS”
Name: “TitleInLinksTrigrams”
Ticket: “BUKI-1264”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/titleinlinkstrigrams”
Tags: [TG_DOC, TG_DOC_TEXT, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “Proportion of unique title trigrams in link trigrams”
Authors: “morph”
Responsibles: “morph”
}
Factor {
Index: 598
CppName: “FI_LINKS_IN_TITLE_TRIGRAMS”
Name: “LinksInTitleTrigrams”
Ticket: “BUKI-1264”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/titleinlinkstrigrams”
Tags: [TG_DOC, TG_DOC_TEXT, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_UNUSED]
Description: “Proportion of unique link trigrams in title trigrams”
Authors: “morph”
Responsibles: “morph”
}
Factor {
Index: 599
CppName: “FI_TRASH_ADV”
Name: “TrashAdv”
Ticket: “SEARCH-254”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/Antispam/AntiTrash/adv/TrashAdvFactor”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Page Ads”
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 600
CppName: “FI_METRIKA_URL_VISITS”
Name: “MetrikaUrlVisits”
Ticket: [“BUKI-1148”, “BUKI-1274”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlVisits”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: “Similar to YabarUrlVisits”
Authors: “smikler”
Responsibles: [“smikler”, “tarum”, “niknik”]
}
Factor {
Index: 601
CppName: “FI_URLGEO_ADMS”
Name: “UrlGeoAdms”
Ticket: “QREG-23”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/geo/RegNavQueries”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_URL_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “The URL of the document corresponds to the region (area) of the user ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/geo/RegNavQueries /JandeksPoisk/KachestvoPoiska/geo/RegNavQueries))”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 602
CppName: “FI_URLGEO_CITY”
Name: “UrlGeoCity”
Ticket: “QREG-23”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/geo/RegNavQueries”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNUSED]
Description: “Document URL matches the user’s city”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 603
CppName: “FI_REG_NAV_QUERY”
Name: “RegNavQuery”
DependsOn: [{Feature: [“RegNavQuery”], Slice: “begemot_query_factors”}]
Ticket: “QREG-23”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/geo/RegNavQueries”
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Regional navigation query – the user’s region has one or more navigation results for it”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 604
CppName: “FI_YABAR_URL_LCAC”
Name: “YabarUrlLcAc”
Ticket: “BUKI-1295”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YabarUrlLcAc”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_REARR_USE, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Number of sessions in which the url was last, divided by the number of sessions in which the url appeared”
Authors: “snailer”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 605
CppName: “FI_SOWNER_MAX_SUM_SOURCE_RANK”
Name: “SOMaxSumSourceRank”
Ticket: “BUKI-1214”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SOMaxSumSourceRank”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_USER, TG_BROWSER, TG_COUNTER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_TRANS, TG_UNDOCUMENTED, TG_L2, TG_UNUSED]
Description: “The sum of the maximum SourceRanks for each incoming link, taking into account the uniqueness of the owner.”
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 606
CppName: “FI_DBM35”
Name: “DBM35”
Ticket: “BUKI-1303”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/DBM35”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Description: “BM25 for texts and links with special weights for matching level (form, lemma, synonym)”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 607
CppName: “FI_TRLR_QUORUM_FM”
Name: “TRLRQuorumFm”
Ticket: “BUKI-1303”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/DBM35”
Group: “TextAndLinkBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_LINK_TEXT, TG_DEPRECATED]
Description: “The weight of the query words that are in the text in the exact form”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 608
CppName: “FI_TRLR_QUORUM_LEMMA”
Name: “TRLRQuorumLemma”
Ticket: “BUKI-1303”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/DBM35”
Group: “TextAndLinkBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: “The weight of the query words that are in the text up to the lemma”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 609
CppName: “FI_TRLR_QUORUM_SYN”
Name: “TRLRQuorumSyn”
Ticket: “BUKI-1303”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/DBM35”
Group: “TextAndLinkBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_LINK_TEXT, TG_DEPRECATED]
Description: “The weight of the query words that are in the text”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 610
CppName: “FI_QUERY_ISHUM”
Name: “IsHum”
DependsOn: [{Feature: [“IsHum”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1316”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsHum”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Reduces the maximum weight of the encountered object of the category Hum or Hum1 in the request to the base searches under the name ishum. (See ((http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects som markup))). ((http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#ishum More))”
Authors: “arseny”
Responsibles: “arseny”
}
Factor {
Index: 611
CppName: “FI_QUERY_ISTEXT”
Name: “IsText”
DependsOn: [{Feature: [“IsText”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1316”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsText”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Reduces to basic searches under the name istext the maximum weight of the encountered object of the category Text or Text1 in the request. (See ((http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects som markup))). ((http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#istext More))”
Authors: “arseny”
Responsibles: “arseny”
}
Factor {
Index: 612
CppName: “FI_QUERY_ISPICTURE”
Name: “IsPicture”
DependsOn: [{Feature: [“IsPicture”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1316”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsPicture”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Reduces the maximum weight of the encountered object of the Picture or Picture1 category in the request to the base searches under the name ispicture. (See ((http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects som markup))). ((http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#ispicture More))”
Authors: “arseny”
Responsibles: “arseny”
}
Factor {
Index: 613
CppName: “FI_QUERY_MAXONE”
Name: “MaxOne”
DependsOn: [{Feature: [“MaxOne”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1316”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MaxOne”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Returns, under the name wmaxone, the maximum degree of commonality of encountered objects in the request. (See ((http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects som markup))). ((http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#maxone More))”
Authors: “arseny”
Responsibles: “arseny”
}
Factor {
Index: 614
CppName: “FI_QUERY_MINONE”
Name: “MinOne”
DependsOn: [{Feature: [“MinOne”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1316”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MinOne”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Returns, under the name wminone, the maximum degree of nominality of encountered objects in the request. (See ((http://wiki.yandex-team.ru/AlekseySokirko/QueryObjects som markup))). ((http://wiki.yandex-team.ru/ArsenGadzhikurbanov/Wares#minone More))”
Authors: “arseny”
Responsibles: “arseny”
}
Factor {
Index: 615
CppName: “FI_OQ_BM25_STR”
Name: “OqBm25Str”
Ticket: [“BUKI-1185”, “BUKI-1270”, “BUKI-1311”, “BETATEST-2194”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBm25Str”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “Bm25 by query index for domAttr”
Authors: [“agorodilov”, “vvp”]
Responsibles: [“agorodilov”, “alsafr”]
}
Factor {
Index: 616
CppName: “FI_OQ_BM25_LEM”
Name: “OqBm25Lem”
Ticket: [“BUKI-1185”, “BUKI-1270”, “BUKI-1311”, “BETATEST-2194”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBm25Lem”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “Bm25 by query index for domAttr”
Authors: [“agorodilov”, “vvp”]
Responsibles: [“agorodilov”, “alsafr”]
}
Factor {
Index: 617
CppName: “FI_OQ_BM25_SYN”
Name: “OqBm25Syn”
Ticket: [“BUKI-1185”, “BUKI-1270”, “BUKI-1311”, “BETATEST-2194”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBm25Syn”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “Bm25 by query index for domAttr”
Authors: [“agorodilov”, “vvp”]
Responsibles: [“agorodilov”, “alsafr”]
}
Factor {
Index: 618
CppName: “FI_OQ_BCLM_WEIGHTED”
Name: “OqBclmWeighted”
Ticket: [“BUKI-1185”, “BUKI-1270”, “BUKI-1311”, “BETATEST-2194”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBclmWeighted”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “BCLM by query index for domAttr”
Authors: [“agorodilov”, “vvp”]
Responsibles: [“agorodilov”, “alsafr”]
}
Factor {
Index: 619
CppName: “FI_OQ_BCLM_PLAIN”
Name: “OqBclmPlain”
Ticket: [“BUKI-1185”, “BUKI-1270”, “BUKI-1311”, “BETATEST-2194”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OqBclmPlain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_OFTEN_ZERO]
Description: “BCLM by query index for owners”
Authors: [“agorodilov”, “vvp”]
Responsibles: [“agorodilov”, “alsafr”]
}
Factor {
Index: 620
CppName: “FI_LINKS_ALIVE”
Name: “LinksAlive”
Ticket: “BUKI-1130”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LinksAlive”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_LINK_GRAPH, TG_TRANS, TG_UNUSED, TG_OFTEN_ZERO, TG_L2]
Description: “Allows you to evaluate whether a document is ‘live’ in terms of incoming links to it.”
Authors: [“egoist”, “vvp”]
Responsibles: [“egoist”, “alsafr”]
}
Factor {
Index: 621
CppName: “FI_SMALL_WINDOW”
Name: “SmallWindow”
Ticket: “BUKI-1311”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SmallWindow”
Group: “combinedabs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED, TG_REARR_USE]
Description: “Maximum weight of query words in a window of 50 words”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 622
CppName: “FI_METRIKA_URL_VISITORS”
Name: “MetrikaUrlVisitors”
Ticket: “BUKI-1148”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlVisitors”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: “Similar to YabarUrlVisitors”
Authors: “smikler”
Responsibles: [“smikler”, “tarum”, “niknik”]
}
Factor {
Index: 623
CppName: “FI_METRIKA_URL_AVG_TIME”
Name: “MetrikaUrlAvgTime”
Ticket: “BUKI-1148”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlAvgTime”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_REARR_USE, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: “Similar to YabarUrlAvgTime”
Authors: “smikler”
Responsibles: [“smikler”, “tarum”, “niknik”]
}
Factor {
Index: 624
CppName: “FI_METRIKA_URL_CORE_AUDIENCE”
Name: “MetrikaUrlCoreAudience”
Ticket: “BUKI-1268”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlCoreAudience”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_DEPRECATED, TG_UNUSED]
Description: “Audience core of pages that have a Metrica counter”
Authors: “smikler”
Responsibles: “smikler”
}
Factor {
Index: 625
CppName: “FI_REGEX_MAX_CLICK_PERCENT”
Name: “RegexMaxClickPercent”
Ticket: “BUKI-1300”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent”
Group: “Regex”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Description: “Percentage of clicks on this URL among all clicks on similar queries”
Authors: “finder”
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 626
CppName: “FI_REGEX_CTR”
Name: “RegexCtr”
Ticket: “BUKI-1300”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexctr”
Group: “Regex”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Description: “Corrected CTR of this URL for all related queries”
Authors: “finder”
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 627
CppName: “FI_DOM_PHRASE_CLICK_RANK_BI”
Name: “DomPhraseClickRankBi”
Ticket: “BUKI-1278”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat”
Group: “domain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: “Domain CTR by bigrams (excluding thesaurus query extensions)”
Authors: [“finder”, “kartynnik”]
Responsibles: [“kartynnik”, “akhropov”]
}
Factor {
Index: 628
CppName: “FI_DOM_PHRASE_YABAR_BI”
Name: “DomPhraseYabarBi”
Ticket: “BUKI-1278”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat”
Group: “domain”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED, TG_UNDOCUMENTED]
Description: “Transitions to the site from search engines by bigrams, according to Bar (excluding thesaurus query extensions)”
Authors: [“finder”, “kartynnik”]
Responsibles: [“kartynnik”, “akhropov”]
}
Factor {
Index: 629
CppName: “FI_LAST_WORD_HOST_CLICKS”
Name: “LastWordHostClicks”
Ticket: “BUKI-1278”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/Domfeat”
Group: “domain”
Tags: [TG_DYNAMIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED, TG_UNDOCUMENTED, TG_OFTEN_ZERO]
Description: “Host click-through rate for the last query word (excluding thesaurus query extensions)”
Authors: [“finder”, “kartynnik”]
Responsibles: [“kartynnik”, “akhropov”]
}
Factor {
Index: 630
CppName: “FI_HOST_HAS_FEED_URLS”
Name: “HostHasFeedUrls”
Ticket: “SEARCHSPAM-15486”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “ulyanov”]
Description: “OffersBase feature for ecoboost.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 631
CppName: “FI_IS_FEED_OFFER”
Name: “IsFeedOffer”
Ticket: “SEARCHSPAM-15486”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “ulyanov”]
Description: “OffersBase feature for ecoboost.”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 632
CppName: “FI_HOST_ECOM_KERNEL_1”
Name: “HostEcomKernel1”
Ticket: “SEARCHSPAM-15417”
Authors: [“ngoltsova”, “sdormidontov”]
Responsibles: [“bikulov”, “ngoltsova”, “sdormidontov”]
Description: “Business kernel.”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 633
CppName: “FI_HOST_ECOM_KERNEL_2”
Name: “HostEcomKernel2”
Ticket: “SEARCHSPAM-15417”
Authors: [“ngoltsova”, “sdormidontov”]
Responsibles: [“bikulov”, “ngoltsova”, “sdormidontov”]
Description: “Business kernel.”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV],
ImplementationTime: “2020-09-24”
}
Factor {
Index: 634
CppName: “FI_HOST_ECOM_KERNEL_3”
Name: “HostEcomKernel3”
Ticket: “SEARCHSPAM-15417”
Authors: [“ngoltsova”, “sdormidontov”]
Responsibles: [“bikulov”, “ngoltsova”, “sdormidontov”]
Description: “Business kernel.”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED],
}
Factor {
Index: 635
CppName: “FI_RC_SEARCH_BASE_URL_RATIONAL_SIGMOID_D1TM600_AT_REQ”
Name: “RcSearchBaseUrlRationalSigmoidD1TM600AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: “URL feature computed at the request time from rapid clicks search counters with decay of 1 day”
Ticket: “USERFEAT-1503”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-10-04”
}
Factor {
Index: 636
CppName: “FI_SYNSET_LOCM”
Name: “SynSetLocm”
Ticket: “SEARCH-218”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SynSetLocm”
Group: “SynSetLocm”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LINK_TEXT, TG_DEPRECATED]
Description: “A copy of the factor ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Locm LOCM)) for ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Synset of synsets)).”
Authors: “alexeykruglov”
Responsibles: “alexeykruglov”
}
Factor {
Index: 637
CppName: “FI_SYNSET_LINK_BM25”
Name: “SynSetLinkBM25”
Ticket: “SEARCH-218”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SynSetLinkBM25”
Group: “Dynamic”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LINK_TEXT, TG_OFTEN_ZERO, TG_DEPRECATED]
Description: “A copy of the LinkBM25 factor for ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Synset of synsets)).”
Authors: “alexeykruglov”
Responsibles: “alexeykruglov”
}
Factor {
Index: 638
CppName: “FI_RC_SEARCH_BASE_URL_CONTRAST_D30ODD0_9_X_D30T1_AT_REQ”
Name: “RcSearchBaseUrlContrastD30Odd0_9_X_D30T1AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: “URL feature computed at the request time from rapid clicks search counters with decay of 30 days”
Ticket: “USERFEAT-1503”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-10-04”
}
Factor {
Index: 639
CppName: “FI_REMOVED_639”
Name: “Removed_639”
Tags: [TG_REMOVED]
}
Factor {
Index: 640
CppName: “FI_DMOZ_QUERY_BEST_THEME”
Name: “DmozQueryBestTheme”
DependsOn: [{Feature: [“DmozQueryBestTheme”], Slice: “begemot_query_factors”}]
Ticket: “FOREIGN-221”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DmozQueryBestTheme”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “The most likely query topic, determined by ((http://wiki.yandex-team.ru/JandeksPoisk/ZarubezhnyjjInternet/DMOZqueryClassifier1 by the DMOZTheme wizard’s rule)), only the most popular topics are taken into account (but there are more of them than in the DmozQueryThemes factor). The factor contains the probability that the query matches the topic, but for each topic, its own interval is taken on the interval [0..1]”
Authors: “lamo”
Responsibles: “lamo”
}
Factor {
Index: 641
CppName: “FI_DMOZ_QUERY_THEMES”
Name: “DmozQueryThemes”
DependsOn: [{Feature: [“DmozQueryThemes”], Slice: “begemot_query_factors”}]
Ticket: “FOREIGN-221”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DmozQueryThemes”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “The query topic defined by ((http://wiki.yandex-team.ru/JandeksPoisk/ZarubezhnyjjInternet/DMOZqueryClassifier1 by the DMOZTheme wizard rule)) only a few of the most popular topics are taken into account.”
Authors: “lamo”
Responsibles: “lamo”
}
Factor {
Index: 642
CppName: “FI_DIVERSITY_CATEG_NEED_PHOTO”
Name: “DiversityCategNeedPhoto”
DependsOn: [{Feature: [“DiversityCategNeedPhoto”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1213”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “0 or 1 depending on whether the request has an explicit need_photo intent from the variety”
Authors: “stasd07”
Responsibles: “stasd07”
}
Factor {
Index: 643
CppName: “FI_DIVERSITY_CATEG_NEED_MAP”
Name: “DiversityCategNeedMap”
DependsOn: [{Feature: [“DiversityCategNeedMap”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1213”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “0 or 1 depending on whether the request has an explicit need_map intent from the variety”
Authors: “stasd07”
Responsibles: “stasd07”
}
Factor {
Index: 644
CppName: “FI_LONG_QUERY_SYN”
Name: “LongQuerySyn”
DependsOn: [{Feature: [“LongQuerySyn”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1361”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LongQuerySyn”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_L3_OVERWRITE, TG_DEPRECATED]
Description: “Factor is analogous to LongQuery (the sum of idf of query words), but with ‘correct’ consideration of synonyms. Specifically, the minimum by idf (i.e. the most frequent) of synonyms and the word is selected.”
Authors: “morph”
Responsibles: “morph”
}
Factor {
Index: 645
CppName: “FI_URL_HAS_SHORT_COUNTRY_NAME_TOKEN”
Name: “UrlHasShortCountryNameToken”
Ticket: “FACTOR-2431”
Tags: [TG_DYNAMIC, TG_URL_TEXT, TG_LOCALIZED_COUNTRY, TG_L2, TG_BINARY, TG_NN_OVER_FEATURES_USE]
Description: “The url contains a token that matches the short name of the user’s country. The factor is only considered on the EU stream.”
Authors: “film”
Responsibles: “film”
ImplementationTime: “2020-09-24”
}
Factor {
Index: 646
CppName: “FI_TURKEY_PAGE_RANK”
Name: “TurkishPageRank”
Ticket: “FOREIGN-225”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/TurkeyPageRank”
Tags: [TG_LINK_GRAPH, TG_OWNER, TG_STATIC, TG_LOCALIZED_COUNTRY, TG_UNDOCUMENTED, TG_UNUSED, TG_OFTEN_ZERO]
Countries: CNT_TR
Description: “Personalized Turkish PageRank”
Authors: “lamo”
Responsibles: “lamo”
}
Factor {
Index: 647
CppName: “FI_EXPECTED_FOUND”
Name: “ExpectedFound”
Ticket: “FOREIGN-225”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ExpectedFound”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Expected number of search results”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 648
CppName: “FI_FOOTER_IN_LINKS_TRIGRAMS”
Name: “FooterInLinksTrigrams”
Ticket: “BUKI-1341”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/FooterInLinksTrigrams”
Tags: [TG_DOC, TG_DOC_TEXT, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Proportion of unique footer snippet trigrams in link trigrams”
Authors: “morph”
Responsibles: “morph”
}
Factor {
Index: 649
CppName: “FI_LINKS_IN_FOOTER_TRIGRAMS”
Name: “LinksInFooterTrigrams”
Ticket: “BUKI-1341”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/FooterInLinksTrigrams”
Tags: [TG_DOC, TG_DOC_TEXT, TG_LINK_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “Percentage of Unique Link Trigrams in Footer Trigram Fragment”
Authors: “morph”
Responsibles: “morph”
}
Factor {
Index: 650
CppName: “FI_ERRATUM_LOG_QUERY_PROBABILITY”
Name: “ErratumLogQueryProbability”
DependsOn: [{Feature: [“ErratumLogQueryProbability”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1388”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ErratumLogQueryProbability”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_BROWSER, TG_COUNTER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “Binary logarithm of the query probability for the language model of the erratum typo service”
Authors: “snow”
Responsibles: [“snow”, “christich”]
}
Factor {
Index: 651
CppName: “FI_URL_IS_MARKET_OFFER”
Name: “UrlIsMarketOffer”
Ticket: “COMMERCIAL-41”
Description: “Url is an offer in the latest version of the market base.”
Tags: [TG_DOC, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED]
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
ImplementationTime: “2020-09-27”
}
Factor {
Index: 652
CppName: “FI_DBM40”
Name: “DBM40”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Variation on the theme ((http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DBM25 DBM25)), see ysite/yandex/relevance/dbm25.cpp”
Authors: “denplusplus”
Responsibles: “alsafr”
}
# TODO(FACTORDEL-97): replace with TG_REMOVED, TG_REUSABLE and remove old formulas
Factor {
Index: 653
CppName: “FI_REMOVED_653”
Name: “Removed_653”
Tags: [TG_UNUSED]
}
Factor {
Index: 654
CppName: “FI_BM25_0”
Name: “BM25_0”
Ticket: “FOREIGN-225”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ExpectedFound”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Variation on BM25 theme”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 655
CppName: “FI_BM25_1”
Name: “BM25_1”
Ticket: “FOREIGN-225”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ExpectedFound”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Variation on BM25 theme”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 656
CppName: “FI_BM25_0123”
Name: “BM25_0123”
Ticket: “FOREIGN-225”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/ExpectedFound”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Variation on BM25 theme”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 657
CppName: “FI_QUERY_URL_CORRECTED_CTR”
Name: “QueryUrlCorrectedCtr”
Ticket: “BUKI-1291”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QueryUrlCorrectedCtr”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1832D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “‘Corrected’ clicks counted with RequestAggregateLib”
Authors: “kcd”
Responsibles: [“smikler”, “tarum”, “niknik”]
}
Factor {
Index: 658
CppName: “FI_QUERY_URL_CORRECTED_CTR_REG”
Name: “QueryUrlCorrectedCtr_Reg”
Ticket: “BUKI-1291”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QueryUrlCorrectedCtr”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1832D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “‘Corrected’ clicks counted with RequestAggregateLib. Regional Version”
Authors: “kcd”
Responsibles: [“smikler”, “tarum”, “niknik”]
}
Factor {
Index: 659
CppName: “FI_YABAR_URL_VISITS_REG”
Name: “YabarUrlVisits_Reg”
Ticket: “BUKI-1180”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors”
Group: “RegDocStatic”
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE_TG_USERFTS]
Countries: CNT_RELEV
Description: “Regional url traffic according to Yandex.Bar”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 660
CppName: “FI_METRIKA_URL_HOST_VISIT_TIME”
Name: “MetrikaUrlHostVisitTime”
Ticket: [“BUKI-1272”, “BUKI-1312”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlHostVisitTime”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: “Average time a user spends on the host when accessed externally (from another non-search site) from a specific URL”
Authors: [“gosu”, “smikler”]
Responsibles: [“smikler”, “tarum”, “niknik”]
}
Factor {
Index: 661
CppName: “FI_METRIKA_URL_HOST_VISIT_DEPTH”
Name: “MetrikaUrlHostVisitDepth”
Ticket: [“BUKI-1271”, “BUKI-1312”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/MetrikaUrlHostVisitDepth”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_COUNTER, TG_METRIKA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_30D, TG_NN_OVER_FEATURES_USE]
Description: “Average ‘depth’ (number of hits within the host) of a user’s stay on the host when accessed externally (from another non-search site) from a specific URL”
Authors: [“gosu”, “smikler”]
Responsibles: [“smikler”, “tarum”, “niknik”]
}
Factor {
Index: 662
CppName: “FI_DBM_NUMBERS”
Name: “DBMNumbers”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “DBM separately by numbers”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 663
CppName: “FI_DBM_GEO”
Name: “DBMGeo”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “DBM separately by request geo-objects”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 664
CppName: “FI_DBM_SUBSTANTIVE”
Name: “DBMSubstantive”
Group: “DBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “DBM separately by nouns”
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 665
CppName: “FI_AVG_SESSION_LEN”
Name: “AvgSessionLen”
DependsOn: [{Feature: [“AvgSessionLen”], Slice: “begemot_query_factors”}]
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Description: “Average length of the logical session in which the query occurred”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/AvgSessionLen”
Authors: “denplusplus”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 666
CppName: “FI_NHOP_TEXT_BCLM_WEIGHTED”
Name: “NHopTextBclmWeighted”
Group: “Annotations”
Ticket: “FACTOR-108”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopText”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_LOCALIZED_COUNTRY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_238D, TG_USERFEAT_NHOP]
Countries: CNT_RELEV
Description: “Bclm (weighted) based on texts from hops.”
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 667
CppName: “FI_YABAR_URL_DOWNLOADS”
Name: “YabarUrlDownloads”
Ticket: “SEARCHSPAM-3039”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/YabarUrlDownloads”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS]
Description: “Estimate of the probability of a download from the document”
Authors: “ulyanov”
Responsibles: [“ulyanov”, “tarum”, “niknik”]
}
Factor {
Index: 668
CppName: “FI_BOCM”
Name: “Bocm”
Ticket: “BUKI-1495”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Bocm”
Group: “Bocm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Evaluates whether word positions in document sentences match word positions in a query.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 669
CppName: “FI_HOST_USER_LEAKAGE”
Name: “HostUserLeakage”
Ticket: “COMMERCIAL-55”
Tags: [TG_OWNER, TG_STATIC, TG_L2, TG_NOT_01, TG_DATA_FROM_SAASKV, TG_UNUSED]
Description: “Churn rate of users from the search after visiting the site”
Authors: “alejes”
Responsibles: “alejes”
MaxValue: 1.0
MinValue: -1.0
ImplementationTime: “2020-08-27”
}
Factor {
Index: 670
CppName: “FI_FIO_MATCH”
Name: “FioMatch”
Ticket: “FACTEX-2467”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/OpisanijaFaktorov/FioMatchFactor”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNUSED]
Description: “The document contains the full name from the request.”
Authors: “udovichenko-r”
Responsibles: “udovichenko-r”
}
Factor {
Index: 671
CppName: “FI_IS_INDEX_PAGE”
Name: “IsIndexPage”
Ticket: “FORMULATOR-185”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage”
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “This is index.(html/php/aspx?/…), without cgi parameters. It is computed over all duplicates.”
Authors: “smikler”
Responsibles: “smikler”
}
Factor {
Index: 672
CppName: “FI_IS_INDEX_PAGE_SOFT”
Name: “IsIndexPageSoft”
Ticket: “FORMULATOR-185”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage”
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “This is index.(html/php/aspx?/…), possibly with cgi parameters. It is computed over all duplicates.”
Authors: “smikler”
Responsibles: “smikler”
}
Factor {
Index: 673
CppName: “FI_IS_OWNER”
Name: “IsOwner”
Ticket: “FORMULATOR-185”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage”
Tags: [TG_HOST, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Whether the host is its own owner, conditionally Host == Owner(Host).”
Authors: “smikler”
Responsibles: “smikler”
}
Factor {
Index: 674
CppName: “FI_MIN_PATH_LEN”
Name: “MinPathLen”
Ticket: “FORMULATOR-185”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage”
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Minimum length of PathAndQuery across all near-duplicates.”
Authors: “smikler”
Responsibles: “smikler”
}
Factor {
Index: 675
CppName: “FI_LERF_GEO_LR_LOG_RELEV_CNT”
Name: “XLerfGeoLRlogRelevCnt”
Ticket: “BUKI-1433”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/XLerfGeoLRlogRelevCnt”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Regionalized (only links from the country of the request are taken) version of the XLerfGeoLRlogRelev factor”
Authors: “mdvornikov”
Responsibles: “mdvornikov”
}
Factor {
Index: 676
CppName: “FI_NON_COMM_LERF_NORM_LR_LOG_RELEV_CNT”
Name: “XNonCommLerfNormLRlogRelevCnt”
Ticket: “BUKI-1433”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/XNonCommLerfNormLRlogRelevCnt”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Regionalized (only links from the request country are taken) variant of the XNonCommLerfNormLRlogRelev factor”
Authors: “mdvornikov”
Responsibles: “mdvornikov”
}
Factor {
Index: 677
CppName: “FI_LOCM_CNT”
Name: “LocmCnt”
Ticket: “BUKI-1433”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LocmCnt”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Regionalized (only links from the country of the request are taken) version of the Locm factor”
Authors: “mdvornikov”
Responsibles: “mdvornikov”
}
Factor {
Index: 678
CppName: “FI_LR_RELEV_CNT”
Name: “XLRrelevCnt”
Ticket: “BUKI-1433”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/XLRrelevCnt”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Regionalized (only links from the country of the request are taken) variant of the XLRrelev factor”
Authors: “mdvornikov”
Responsibles: “mdvornikov”
}
Factor {
Index: 679
CppName: “FI_LERF_LR_RELEV_200_CNT”
Name: “XLerfLRrelev200Cnt”
Ticket: “BUKI-1433”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/XLerfLRrelev200Cnt”
Group: “Xref”
Tags: [TG_DOC, TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Regionalized (only links from the country of the request are taken) version of the XLerfLRrelev200 factor”
Authors: “mdvornikov”
Responsibles: “mdvornikov”
}
Factor {
Index: 680
CppName: “FI_NAV_LINEAR”
Name: “NavLinear”
Ticket: [“COMBPROLAB-107”, “SEARCHSPAM-3340”]
Wiki: “http://wiki.yandex-team.ru/MaratXabibraxmanov/seminavigationqueries”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_NAV, TG_TRANS, TG_REARR_USE, TG_DEPRECATED]
Description: “((http://wiki.yandex-team.ru/JandeksPoisk/Antispam/polunavigacionnyezaprosy#faktornavigacionnostiparyurl-zapros classifier)) pair of vitals [request-url], vital url for the request, if the value on it is >0.5”
Authors: [“burangulov”, “kustarev”]
Responsibles: “burangulov”
DependsOn: [{Feature: [“PR”, “LR”, “PrBonus”, “TRp2”, “LRp2”, “Shop”, “YaBar”, “Long”, “LongQuery”, “SR”, “LRHitNum100” , “PctLinks”, “LinkQuality”, “AddTime”, “TLBM25”, “Adv”, “YandexAdv”, “TxtPair”, “TxtHead”, “HasNoQueryShows”, “LogLR”, “TxtPairEx”, “TxtBreakEx”, ” TxtHeadEx”, “TxtPairSy”, “TxtBreakSy”, “TxtHeadSy”, “TxtHiRelSy”, “QueryDOwnerClicksPCTR”, “HasNoQueryDOwnerShows”, “OwnerClicksPCTR”, “XLRp2”, “XLRgood”, “XLRmaxDpr”, “NewLinkQuality”, “TextFeatures” , “TextLike”, “SpamKarma”, “DocLen”, “UrlLen”, “HostSize”, “LinkSpeed”, “XLerfLRlogRelev”, “GeoCityProxim”, “LinksWithWordsPercent”, “LinksWithAllWordsPercent”, “IsComm”, “GeoRegionProxim”, ” TxtSkipPair”, “QDiversity”, “XGeoLRlogRelev”, “XLerfGeoLRlogRelev”, “XNonCommNormLRlogRelev”, “Nevasca2”, “LinkAge”, “XLerfLangLRlogRelev”, “QueryDOwnerClicksFRC”, “QueryDOwnerClicksPCTR_Reg”, “QueryURLClicksFRC_Reg”, “QueryDOwnerClicks”RegboReglicks”, “QueryDOwnerClicks”RegboReglicks”, “QueryDOwnerClicks”RegboReglicks , “XLRCatalogRelev”, “TLp1All”, “BFlemmaAll”, “PassageLegacyTR”, “Tx tBM25AttenSyn”, “MaxWordHostRank”, “MaxWordHostClicks”, “DomPhraseClickRank”, “EshopValue”, “CountersSearchTraffic1”, “CountersSearchTraffic2”, “DomPhraseYabar”, “GeoRelevRegionCountry”, “XLRGeoRelevRegionCountry”, “GeoCountryProxim”, “MaxWordHostsYaBar”, “ClicktWar” , “QueryDOwnerYabarVisits”, “QueryDOwnerYabarVisitors”, “QueryDOwnerYabarAvgTime”, “PageRegionSizeIn”, “PageRegionInvSizeIn”, “GeoGeometryProxim”, “RingsHostRankBadnessOld”, “YabarHostVisitors”, “YabarHostSearchTraffic”, “YabarAHostInternalTraffic”, “YabarTime”, “Host YabarHostAvgActions”, “YabarUrlVisits”, “YabarUrlVisitors”, “YabarUrlAvgTime”, “OwnerSatisfied4Rate”, “TitleIdfSum_broken”, “HeadingIdfSum_broken”, “CommLinksSEOHosts”, “CommLinksSEOHostsNonComm”, “Diversity2”, “MorningQuery”, “LCorryM”, “SubqueryM”, “SubquequeActions” , “OwnerSDiffClickEntropy”, “OwnerSDiffShowEntropy”, “OwnerSDiffCSRatioEntropy”, “UrlDomainFraction”, “UrlPathAndParamsFraction”, 
“LnkBreak”, “LnkPairSy”, “LnkBrkSy”, “OwnerClicksPCTR_Reg”, “OwnerSDiffClickEntropy_Reg”, “OwnerSDiffShowEntropy_Reg”, “OwnerSDiffCSRatioEntropy_Reg”, “IsCom”, “IsNotRu”, “LargestSyInexactGroup”, “SynFLremap1”, “SynFLremap2”, “OwnerSessNormDuration”, “UrlSessQueryNormDurRate”, “QueryDOwnerWeightRate” , “QueryDOwnerClickSummary”, “QueryDOwnerSatisfied4Rate”, “SyntQuality”, “PageDate”, “RingsHostRankBadness3”, “QSegmentsBM25”, “QSegmentsWeight”, “NumLatinLetters”, “RingsHostRankBadness1”, “TitleIdfSumFixed”, “HeadingIdfSumFixed”, “QueryDOwnerClicksCombo”, “LRAmortizedByAge”, “RusWordsInTitle”, “MeanWordLength”, “PercentWordsInLinks”, “PercentVisibleContent”, “PercentFreqWords”, “PercentUsedFreqWords”, “TrigramsProb”, “TrigramsCondProb”, “UrlBM25”, “MatrixNet”, “DaterAge”, “CInDegree2” , “TextMaxForms”, “TextWeightedForms”, “TextForms”, “LinkWeightedForms”, “QSegmentsBreaks”, “ParticlesPortion”, “AdjPronounsPortion”, “AdvPronounsPortion”, “FemAndMasNounsPortion”, “LinkQualityFixed”, “NewLinkQualityFixed”, “IsOrg”, “LongestText”, “LRWithoutRare”, “DifferentInternalLinks”, “HasDeterminedCities”, “UkrainPageRank”, “QClassOAO”, “PeriodicLinkDatesPercent”, “QDOwnerStatPower”, “QUrlStatPower”, “OwnerReqsPopularity”, “SecondIndegDistrXi”, “Swbm25”, “PositionLanguageModel” , “TxtPair_W1”, “AuraDocLogShared”, “AuraDocLogAuthor”, “AuraDocMeanSharedWeight”, “RegHostRank”, “LanguageCompliance”, “CountryQDiversity”, “CountryQDiversity2”, “CountryQueryRegionality”, “NumSlashes”, “BM25FdPR_obsolete”, “GskUrlModel”, “UrlTrigrams”, “YmwFull”, “Bclm”, “QueryCommercialityMx”, “FieldLM”, “GeoCityUrlRegionCountry”, “TitleTrigramsQuery”, “QueryWordSequencesTR”, “OwnerNavQuota”, “GeoRelevAlienCity”, “HostReliability”, “Mpsa”, “PageRegionCoverage” , “PageRegionSize”, “PageRegionRelCoverage”, “IsGeo”, “CityQuery”, “YmwFull2”, “QueryWordCohesionTR”, “QueryDOwnerWeightClick_Reg”, “QueryDOwnerOnlyClickRate_Reg”, “QueryDOwnerClickSummary_Reg”, “QueryDOwnerSatisfied4Rate_Reg”,
“SegmentAuxAlphasInText”, “IsShop”, “XLRGeoRelevRegionNatDomain”, “QueryRefTrigramQuery”, “QueryRefTrigramReferences”, “IdfVariance”, “UrlNGramsModel”, “NumLinksFromSegmentContent”, “Locm”, “UrlQueryVariety_Reg”, “UrlSessNormDurRate_Reg”, “QueryDownerEnoughClicked”, “BM25FdPRFixed”, “QueryDOwnerWeightedSumFRCAndBM25FdPRFixed”, “QueryDOwnerWeightedSumMaxWHRAndOnlyClickRate”, “Tocm”, “RelevGeoLinksPercent”, “UrlLinkPercent”, “NumNonLettersInUrl”, “UrlLen2”, “IsHub”, “StaticTitleBM25Ex”, “StaticTitleLRBM25”, “SeoInPayLinks”, “TitleInLinksTrigrams”, “TrisIngrams”, “YabarUrlLcAc”, “SOMaxSumSourceRank”, “DBM35”, “TRLRQuorumFm”, “TRLRQuorumLemma”, “IsHum”, “MaxOne”, “MinOne”, “OqBm25Str”, “OqBm25Lem”, “OqBm25Syn”, “OqBclmWeighted”, “OqBclmPlain”, “MetrikaUrlCoreAudience”, “DomPhraseClickRankBi”, “DomPhraseYabarBi”, “LastWordHostClicks”, “SynSetLocm”, “DmozQueryBestTheme”, “LongQuerySyn”, “ExpectedFound”]}]
}
Factor {
Index: 681
CppName: “FI_RANK_COM_GOODNESS”
Name: “RankComGoodness”
Ticket: [“BUKI-1504”, “SEARCHSPAM-3204”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RankComGoodness”
Tags: [TG_COMMERCIAL, TG_OWNER, TG_STATIC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_NN_OVER_FEATURES_USE]
Description: “Classifier according to the ratings of commercial sites”
Authors: [“anelyubin”, “sisoid”]
Responsibles: “efedina”
}
Factor {
Index: 682
CppName: “FI_HAS_DOWNLOAD_LINK_ON_FILE”
Name: “HasDownloadLinkOnFile”
Ticket: “ROBOT-2682”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HasDownloadLinkOnFile”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “The document has a direct link to the file”
Authors: “osenzen”
Responsibles: “osenzen”
}
Factor {
Index: 683
CppName: “FI_HAS_DOWNLOAD_LINK_ON_FILE_HOSTING”
Name: “HasDownloadLinkOnFileHosting”
Ticket: “ROBOT-2682”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HasDownloadLinkOnFile”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “There is a link to the file hosting on the document”
Authors: “osenzen”
Responsibles: “osenzen”
}
Factor {
Index: 684
CppName: “FI_DIVERSITY_CATEG_DOWNLOAD”
Name: “DiversityCategDownload”
DependsOn: [{Feature: [“DiversityCategDownload”], Slice: “begemot_query_factors”}]
Ticket: “ROBOT-2688”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “0 or 1 – does the request match the regex from the ticket”
Authors: “stasd07”
Responsibles: “stasd07”
}
Factor {
Index: 685
CppName: “FI_DIVERSITY_CATEG_REVIEW”
Name: “DiversityCategReview”
DependsOn: [{Feature: [“DiversityCategReview”], Slice: “begemot_query_factors”}]
Ticket: “ROBOT-2688”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “0 or 1 – does the request match the regex from the ticket”
Authors: “stasd07”
Responsibles: “stasd07”
}
Factor {
Index: 686
CppName: “FI_DIVERSITY_CATEG_WATCH”
Name: “DiversityCategWatch”
DependsOn: [{Feature: [“DiversityCategWatch”], Slice: “begemot_query_factors”}]
Ticket: “ROBOT-2688”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DiversityCategFactors”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “0 or 1 – does the request match the regex from the ticket”
Authors: “stasd07”
Responsibles: “stasd07”
}
Factor {
Index: 687
CppName: “FI_TUR_QR”
Name: “Qrtur”
DependsOn: [{Feature: [“QrTur”], Slice: “begemot_query_factors”}]
Ticket: “QREG-27”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QrTur”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_DEPRECATED]
Description: “Predicting the share of ‘good’ (at least with two different cities and frequency>=10) mentions of a query with geography in Turkey”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 688
CppName: “FI_QUERY_TH3561”
Name: “QueryThEncyclopedic”
DependsOn: [{Feature: [“QueryThEncyclopedic”], Slice: “begemot_query_factors”}]
Ticket: “QREG-28”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Th3561”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “The result of the lexical query classifier, which predicts the probability of a click on the topic page 3561”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 689
CppName: “FI_QUERY_TH3973”
Name: “QueryThVideohosting”
DependsOn: [{Feature: [“QueryThVideohosting”], Slice: “begemot_query_factors”}]
Ticket: “QREG-28”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Th3561”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_THEME_CLASSIF, TG_USER, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “The result of the lexical query classifier, which predicts the probability of a click on the topic page 3973”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 690
CppName: “FI_QUERY_IS_NAV_MX”
Name: “IsNavMxQuery”
DependsOn: [{Feature: [“IsNavMxQuery”], Slice: “begemot_query_factors”}]
Ticket: “SEARCHSPAM-3647”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsNavMxQuery”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_NAV, TG_TRANS, TG_UNDOCUMENTED, TG_L2, TG_REARR_USE, TG_DEPRECATED]
Countries: CNT_RU
Description: “Query ‘navigability’ rank”
Authors: [“anelyubin”, “kvn”]
Responsibles: [“anelyubin”, “kvn”]
DependsOn: [{Feature: [“QueryNonCommerciality”, “ProductCategoryQuery”, “ProductCategoryVendor”, “IsNavQuery”, “QClassDownload”, “QClassBrandnames”, “QClassDisease”, “QClassKak”, “QClassMoscow”, “QClassOAO”, “QClassPorno” , “QClassTravel”, “CountryPopularQ”]}]
}
Factor {
Index: 691
CppName: “FI_QUERY_URL_YABAR_VISITS_REG”
Name: “QueryUrlYabarVisits_Reg”
Ticket: “BUKI-1180”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YabarUrlFactors”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_VISITS_ACTIVITY_DOWNLOADS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “regional traffic from search engines for a specific query”
Authors: “akhropov”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 692
CppName: “FI_CLICKED_WITH_ANOTHER_SE_CLICKS”
Name: “ClickedWithAnotherSEClicks”
Ticket: “BUKI-1261”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ShowsAndClicksWithAnotherSEClicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Clicks on URLs shown in the search results for queries after which users went on to search in other search engines”
Authors: “vvp”
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 693
CppName: “FI_SHOWS_WITH_ANOTHER_SE_CLICKS”
Name: “ShowsWithAnotherSEClicks”
Ticket: “BUKI-1261”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ShowsAndClicksWithAnotherSEClicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Impressions of URLs in the search results for queries after which users went on to search in other search engines”
Authors: “vvp”
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 694
CppName: “FI_COMMERCIAL_OWNER_RANK_REG”
Name: “CommercialOwnerRank_Reg”
Ticket: [“BUKI-1503”, “SEARCHSPAM-3082”, “SEARCHSPAM-3486”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/CommercialOwnerRank_Reg”
Group: “RegHostStatic”
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COMMERCIAL, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_DEPRECATED]
Countries: [CNT_RU, CNT_TR]
Description: “Commercial site classifier”
Authors: [“anelyubin”, “sisoid”]
Responsibles: “efedina”
}
Factor {
Index: 695
CppName: “FI_HOST_IS_MARKET_OFFER”
Name: “HostIsMarketOffer”
Ticket: “COMMERCIAL-41”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “There are offers from this host in the latest version of the market database.”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_NN_OVER_FEATURES_USE]
ImplementationTime: “2020-09-23”
}
Factor {
Index: 696
CppName: “FI_BCLM_MAX”
Name: “BclmMax”
Ticket: “BUKI-1575”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BclmMax”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Proximity of query words to the heaviest word.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 697
CppName: “FI_URL_PRON_REGEXP_MATCH”
Name: “UrlPronRegexpMatch”
Ticket: “SEARCH-10629”
Tags: [TG_URL_TEXT, TG_UNUSED, TG_BINARY]
Description: “Url matches regexp expression given in pron”
Authors: “timuratshin”
Responsibles: “timuratshin”
}
Factor {
Index: 698
CppName: “FI_HAS_USER_REVIEWS”
Name: “HasUserReviews”
Ticket: “ROBOT-2571”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HasUserReviews”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Document contains user feedback/comment”
Authors: [“bogomolov”, “kartynnik”, “osenzen”]
Responsibles: [“kartynnik”, “osenzen”]
}
Factor {
Index: 699
CppName: “FI_REGEX_MAX_CLICK_PERCENT_REG”
Name: “RegexMaxClickPercentReg”
Ticket: “BUKI-1300”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent”
Group: “Regex”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “Percentage of clicks on this URL among all clicks on similar queries, country version, see ((http://wiki.yandex-team.ru/Development/Poisk/arcadia/indexregex indexregex))”
Authors: [“finder”, “kcd”]
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 700
CppName: “FI_REGEX_CTR_REG”
Name: “RegexCtrReg”
Ticket: “BUKI-1300”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexctr”
Group: “Regex”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “corrected CTR of this URL for all related queries, country version, see ((http://wiki.yandex-team.ru/Development/Poisk/arcadia/indexregex indexregex))”
Authors: [“finder”, “kcd”]
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 701
CppName: “FI_FOUND”
Name: “Found”
DependsOn: [{Feature: [“Found”], Slice: “begemot_query_factors”}]
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Found”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_DEPRECATED]
Countries: CNT_ALL
Description: “Average number of search results”
Authors: “denplusplus”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 702
CppName: “FI_YABAR_WORD_DNGI”
Name: “YabarWordDepthNodesGradientMin”
DependsOn: [{Feature: [“YabarWordDepthNodesGradientMin”], Slice: “begemot_query_factors”}]
Ticket: “BUKI-1482”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostStatistics”
Group: “Query”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_DEPRECATED]
Description: “Angle in Depth Nodes space, counted by words only (Min by all)”
Authors: [“atolstikov”, “smikler”]
Responsibles: [“atolstikov”, “smikler”]
}
Factor {
Index: 703
CppName: “FI_DBM15_WARES”
Name: “DBM15Wares”
Ticket: “BUKI-1300”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RegexCtr”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 704
CppName: “FI_RANK_COM_GOODNESS_BAR”
Name: “RankComGoodnessBar”
Ticket: [“SEARCHSPAM-3759”, “SEARCHSPAM-3970”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RankComGoodnessBar”
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_COMMERCIAL, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RU
Description: “A classifier that approximates the quality of commercial sites based on user behavior data”
Authors: [“reat”, “sisoid”]
Responsibles: “efedina”
}
Factor {
Index: 705
CppName: “FI_DOC_CREATE_MONTH”
Name: “DocCreateMonth”
Ticket: “BUKI-1583”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DocMonthFactors”
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED, TG_L2]
Description: “Document creation time, accurate to the month: 1.0 — current month, 0 — 10 years ago and older. Temporarily disabled”
Authors: “bochkarev”
Responsibles: “bochkarev”
}
Factor {
Index: 706
CppName: “FI_DOC_UPDATE_MONTH”
Name: “DocUpdateMonth”
Ticket: “BUKI-1583”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DocMonthFactors”
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_DEPRECATED, TG_UNDOCUMENTED, TG_L2]
Description: “Document update time, accurate to the month: 1.0 — current month, 0 — 10 years ago and older. Temporarily disabled”
Authors: “bochkarev”
Responsibles: “bochkarev”
}
Factor {
Index: 707
CppName: “FI_LR_SOURCERANK”
Name: “XLRSourceRank”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/XLR-SourceRank-MainPage”
Group: “Xref”
Tags: [TG_DYNAMIC, TG_LINK_GRAPH, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 708
CppName: “FI_LR_MAINPAGE”
Name: “XLRMainPage”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/XLR-SourceRank-MainPage”
Group: “Xref”
Tags: [TG_DYNAMIC, TG_LINK_GRAPH, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_LINK_TEXT, TG_DEPRECATED]
Authors: “denplusplus”
Responsibles: “alsafr”
}
Factor {
Index: 709
CppName: “FI_DATER_STATS_YEAR_NORM_LIKELIHOOD”
Name: “DaterStatsYearNormLikelihood”
Ticket: “BUKI-1619”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DaterStatsYearNormLikelihood”
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Likelihood function for the distribution of years in a document. Temporarily disabled”
Authors: “bochkarev”
Responsibles: “bochkarev”
}
Factor {
Index: 710
CppName: “FI_HOST_NUM_SOVETNIK”
Name: “HostNumSovetnik”
Ticket: “CONTENTQUALITY-45”
Authors: [“sdormidontov”]
Responsibles: [“ulyanov”, “sdormidontov”]
Description: “Num of Sovetnik urls”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 711
CppName: “FI_LCM_VAR”
Name: “LcmVar”
Ticket: “BUKI-1622”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LocmVar”
Group: “Xref”
Tags: [TG_DYNAMIC, TG_LINK_TEXT, TG_UNDOCUMENTED, TG_DEPRECATED]
Description: “Dispersion in the number of query words in links.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 712
CppName: “FI_DATER_STATS_AVERAGE_SOURCE_SEGMENT”
Name: “DaterStatsAverageSourceSegment”
Ticket: “BUKI-1619”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DaterStatsAverageSourceSegment”
Tags: [TG_DATE, TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Arithmetic mean of document date positions. Temporarily disabled”
Authors: “bochkarev”
Responsibles: “bochkarev”
}
Factor {
Index: 713
CppName: “FI_DBM15_WARES2”
Name: “DBM15Wares2”
Ticket: “BUKI-1300”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RegexCtr”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 714
CppName: “FI_CABM”
Name: “Cabm”
Ticket: “BUKI-1629”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/Cabm”
Group: “Xref”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_LINK_TEXT, TG_DEPRECATED]
Description: “BM with fading on the text of catalog links.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 715
CppName: “FI_BEAST_NQUERY_URL_MEAN_POS”
Name: “BeastNqUrlMeanPos”
Ticket: “BUKI-1581”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastNqSiteMeanPos”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_BEAST, TG_DOPP, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_365D, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_TR
Description: “Average url position for a normalized query”
Authors: [“solar”, “vvp”]
Responsibles: [“solar”, “alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 716
CppName: “FI_BEAST_NQUERY_OWNER_MEAN_POS”
Name: “BeastNqOwnerMeanPos”
Ticket: “BUKI-1581”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastNqSiteMeanPos”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_BEAST, TG_DOPP, TG_USER_SEARCH_EXTERNAL, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_365D, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_TR
Description: “Average position of domAttr by normalized query”
Authors: [“solar”, “vvp”]
Responsibles: [“solar”, “alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 717
CppName: “FI_BEAST_URL_MEAN_POS”
Name: “BeastUrlMeanPos”
Ticket: “BUKI-1581”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastSiteMeanPos”
Group: “RegDocStatic”
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_365D, TG_NN_OVER_FEATURES_USE]
Countries: CNT_TR
Description: “Average url position across all queries”
Authors: [“solar”, “vvp”]
Responsibles: [“solar”, “alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 718
CppName: “FI_BEAST_HOST_MEAN_POS”
Name: “BeastHostMeanPos”
Ticket: “BUKI-1581”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastSiteMeanPos”
Group: “RegHostStatic”
Tags: [TG_STATIC, TG_HOST, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Countries: CNT_TR
Description: “Average host position across all queries”
Authors: [“solar”, “vvp”]
Responsibles: [“solar”, “alsafr”]
}
Factor {
Index: 719
CppName: “FI_BEAST_URL_NUM_QUERIES”
Name: “BeastUrlNumQueries”
Ticket: “BUKI-1581”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastSiteNumQueries”
Group: “RegDocStatic”
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Countries: CNT_TR
Description: “Number of requests per url”
Authors: [“solar”, “vvp”]
Responsibles: [“solar”, “alsafr”]
}
Factor {
Index: 720
CppName: “FI_BEAST_HOST_NUM_QUERIES”
Name: “BeastHostNumQueries”
Ticket: “BUKI-1581”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/BeastSiteNumQueries”
Group: “RegHostStatic”
Tags: [TG_STATIC, TG_HOST, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_UNDOCUMENTED, TG_L2, TG_USERFEAT, TG_USERFEAT_365D, TG_NN_OVER_FEATURES_USE]
Countries: CNT_TR
Description: “Number of requests per host”
Authors: [“solar”, “vvp”]
Responsibles: [“solar”, “alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 721
CppName: “FI_YABAR_HOST_BROWSE_RANK_REG”
Name: “YabarHostBrowseRank_Reg”
Ticket: [“BUKI-1652”, “FACTOR-56”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/YaBarLogs”
Group: “RegHostStatic”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_LOCALIZED_COUNTRY, TG_UNIMPLEMENTED, TG_L2]
Countries: CNT_RELEV
Description: “implementation of the algorithm described in the article ((http://wiki.yandex-team.ru//h.yandex.net/?http%3A%2F%2Fresearch.microsoft.com%2Fen-us%2Fpeople%2Ftyliu%2Ffp032-liu.pdf http://research.microsoft.com/en-us/people/tyliu/fp032-liu.pdf)) by large regions (TUBE)”
Authors: “akhropov”
Responsibles: “akhropov”
}
Factor {
Index: 722
CppName: “FI_REMOVED_722”
Name: “Removed_722”
Tags: [TG_REMOVED]
}
Factor {
Index: 723
CppName: “FI_SEGMENT_WORD_PORTION_FROM_MAINCONTENT”
Name: “SegmentWordPortionFromMainContent”
Ticket: “BUKI-1671”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/SegmentWordPortionFromMaincontent”
Tags: [TG_DOC, TG_DOC_TEXT, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Proportion of document words from segments with score > 2.”
Authors: “nordic”
Responsibles: “nordic”
}
Factor {
Index: 724
CppName: “FI_URL_DOMAIN_SIMILARITY_FIXED”
Name: “UrlDomainSimilarityFixed”
Ticket: “BUKI-1647”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/urldomainsimilarity”
Group: “Dynamic”
Tags: [TG_HOST, TG_DYNAMIC, TG_URL_TEXT, TG_UNDOCUMENTED, TG_REARR_USE, TG_L2, TG_NN_OVER_FEATURES_USE, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 725
CppName: “FI_TOTAL_DUPS”
Name: “TotalDups”
Ticket: “FORMULATOR-185”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/IsIndexPage”
Tags: [TG_DOC, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Authors: “smikler”
Responsibles: “alsafr”
}
Factor {
Index: 726
CppName: “FI_RANK_BOOST_GOODNESS”
Name: “RankBoostGoodness”
Ticket: [“FACTOR-32”, “SEARCHSPAM-3858”, “SEARCHSPAM-4133”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/RankBoostGoodness”
Tags: [TG_COMMERCIAL, TG_OWNER, TG_STATIC, TG_LOCALIZED_COUNTRY, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RU
Description: “Site quality rank used for boosts of the Moscow commercial formula”
Authors: [“burmisha”, “sisoid”]
Responsibles: “efedina”
}
Factor {
Index: 727
CppName: “FI_QUERY_DOWNER_CLICKS_FRC_REG_GEO”
Name: “QueryDOwnerClicksFRCRegGeo”
Ticket: “QREG-31”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoClicks”
Tags: [TG_DYNAMIC, TG_DOWNER, TG_LOCALIZED_CITY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_USER_SEARCH_EXTERNAL, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Authors: “esoloviev”
Responsibles: [“esoloviev”, “yazevnul”, “niknik”, “tarum”]
}
Factor {
Index: 728
CppName: “FI_QUERY_URL_CLICKS_FRC_REG_GEO”
Name: “QueryURLClicksFRCRegGeo”
Ticket: “QREG-31”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoClicks”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_CITY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Authors: “esoloviev”
Responsibles: [“esoloviev”, “yazevnul”, “niknik”, “tarum”]
}
Factor {
Index: 729
CppName: “FI_LANGUAGE_DISTRIBUTION”
Name: “LanguageDistribution”
Ticket: “BUKI-1396”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/LanguageDistribution”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Authors: “avatar”
Responsibles: [“avatar”, “tarum”, “niknik”]
}
Factor {
Index: 730
CppName: “FI_URL_SHOWS_WITH_NEXT_PAGE_CLICKS_P1”
Name: “UrlShowsWithNextPageClicksP1”
Ticket: “BUKI-1549”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/ShowsWithNextPageClicks”
Group: “RegDocStatic”
Tags: [TG_LOCALIZED_COUNTRY, TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Authors: “morph”
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 731
CppName: “FI_URL_SHOWS_WITH_NEXT_PAGE_CLICKS_P10”
Name: “UrlShowsWithNextPageClicksP10”
Ticket: “BUKI-1549”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/ShowsWithNextPageClicks”
Description: “Factor used in SelectionRank. TG_UNUSED: should not be included in formulas to avoid feedback”
Group: “RegDocStatic”
Tags: [TG_LOCALIZED_COUNTRY, TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_UNUSED, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2]
Authors: “morph”
Responsibles: “alsafr”
}
Factor {
Index: 732
CppName: “FI_URL_CLICKS_PCTR_YEAR”
Name: “QueryURLClicksPCTRYear”
AntiSeoUpperBound: 0.6
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_UNUSED, TG_OFTEN_ZERO]
Ticket: “BUKI-1658”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/QueryUrlClicksPCTRYear”
Authors: “apos”
Responsibles: “apos”
}
Factor {
Index: 733
CppName: “FI_URL_CLICKS_PCTR_YEARP”
Name: “QueryURLClicksPCTRPreviousYear”
AntiSeoUpperBound: 0.6
Ticket: “BUKI-1658”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_REARR_USE, TG_UNUSED, TG_OFTEN_ZERO]
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/QueryUrlClicksPCTRYear”
Authors: “apos”
Responsibles: “apos”
}
Factor {
Index: 734
CppName: “FI_SMALL_WINDOW_ATTENUATION”
Name: “SmallWindowAttenuation”
Ticket: “FACTOR-28”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/SmallWindow”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_UNDOCUMENTED, TG_DEPRECATED]
Responsibles: “alsafr”
}
Factor {
Index: 735
CppName: “FI_RC_SEARCH_BASE_URL_RATIONAL_SIGMOID_D3T120_AT_REQ”
Name: “RcSearchBaseUrlRationalSigmoidD3T120AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: “URL feature computed at the request time from rapid clicks search counters with decay of 3 days”
Ticket: “USERFEAT-1503”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-10-04”
}
Factor {
Index: 736
CppName: “FI_OWNER_CTR_WITH_NEXT_PAGE_CLICKS_P10”
Name: “OwnerCTRWithNextPageClicksP10”
Ticket: “FACTOR-30”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/ShowsWithNextPageClicks”
Group: “RegHostStatic”
Tags: [TG_LOCALIZED_COUNTRY, TG_STATIC, TG_OWNER, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_OFTEN_ZERO, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF, TG_DEPRECATED]
Authors: “vvp”
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 737
CppName: “FI_COMM_RUS”
Name: “CommRus”
Ticket: [“FACTOR-31”, “SEARCHSPAM-3722”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/CommRus”
Tags: [TG_COMMERCIAL, TG_DOC, TG_STATIC, TG_LOCALIZED_COUNTRY, TG_UNDOCUMENTED, TG_L2, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RU
Description: “The weight of the document according to the one-word dictionary of commercial vocabulary”
Authors: “sisoid”
Responsibles: [“bikulov”, “ashagarov”]
}
Factor {
Index: 738
CppName: “FI_WIKI_LINK_COUNT”
Name: “WikiLinkCount”
Ticket: “FACTOR-54”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/WikiLinkCount”
Tags: [TG_DOC, TG_LINK_GRAPH, TG_STATIC, TG_USER, TG_WIKIPEDIA, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1D, TG_NN_OVER_FEATURES_USE]
Authors: [“sokirko”, “bogomolov”]
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 739
CppName: “FI_URL_IN_LINKS_TRIGRAMS_STATIC”
Name: “UrlInLinksTrigramsStatic”
Ticket: “FACTOR-43”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlLinksTrigramsStatic”
Tags: [TG_DOC, TG_LINK_TEXT, TG_STATIC, TG_URL_TEXT, TG_L2, TG_UNUSED]
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 740
CppName: “FI_LINKS_IN_URL_TRIGRAMS_STATIC”
Name: “LinksInUrlTrigramsStatic”
Ticket: “FACTOR-43”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/UrlLinksTrigramsStatic”
Tags: [TG_DOC, TG_LINK_TEXT, TG_STATIC, TG_URL_TEXT, TG_L2, TG_UNUSED]
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 741
CppName: “FI_UKR_IS_QUERY_LANG”
Name: “UkrIsQueryLang”
Ticket: “FACTOR-51”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/UkrIsQueryLang”
Tags: [TG_QUERY_ONLY, TG_BINARY, TG_DYNAMIC, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Description: “Shows that the request is in Ukrainian”
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 742
CppName: “FI_QUERIES_AVG_CM2”
Name: “QueriesAvgCM2”
Ticket: “FACTOR-66”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/QueriesAvgCM2”
Tags: [TG_STATIC, TG_OWNER, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_COMMERCIAL, TG_L2, TG_MASCOT, TG_UNDOCUMENTED, TG_NN_OVER_FEATURES_USE]
Countries: [CNT_RU, CNT_TR]
Description: “Average query commerciality”
Authors: [“burmisha”, “sisoid”]
Responsibles: “efedina”
}
Factor {
Index: 743
CppName: “FI_QI_QUERY_COUNT”
Name: “QiQueryCount”
Group: “QI”
Ticket: “FACTOR-63”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USER_SEARCH_EXTERNAL, TG_DEPRECATED]
Description: “Number of requests in the group of frequency requests similar to the given one”
Authors: [“agorodilov”, “morph”]
Responsibles: [“smikler”, “tsimkha”]
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/oldqifactors”
}
Factor {
Index: 744
CppName: “FI_QI_URL_FREQ_WEIGHTED_FRC”
Name: “QiUrlFreqWeightedFRC”
Group: “QI”
Ticket: “FACTOR-63”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Description: “FRC groups of frequency queries similar to the given one, averaged over the sum of clicks and impressions”
Authors: [“agorodilov”, “morph”]
Responsibles: [“smikler”, “tsimkha”]
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/oldqifactors”
}
Factor {
Index: 745
CppName: “FI_QI_URL_FREQ_WEIGHTED_FRC_REG”
Name: “QiUrlFreqWeightedFRCReg”
Group: “QI”
Ticket: “FACTOR-63”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “FRC groups of frequency queries similar to the given one, averaged over the sum of clicks and impressions, according to regional statistics”
Authors: “morph”
Responsibles: [“smikler”, “tsimkha”]
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/oldqifactors”
}
Factor {
Index: 746
CppName: “FI_RC_SEARCH_BASE_URL_RATIONAL_SIGMOID_D1TM600_FROZEN”
Name: “RcSearchBaseUrlRationalSigmoidD1TM600Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: “URL feature computed from rapid clicks search frozen counters with decay of 1 day”
Ticket: “USERFEAT-1503”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-10-04”
}
Factor {
Index: 747
CppName: “FI_WORD_HOST_WIKI_SUM”
Name: “WordHostWikiSum”
Ticket: “BUKI-1515”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regwordhost”
Group: “RegWordHost”
Tags: [TG_DYNAMIC, TG_HOST, TG_WIKIPEDIA, TG_LINK_GRAPH, TG_DEPRECATED]
Description: “The relative popularity of the word-host pair, where word is the word from the title of the Wikipedia article and host is the host that is referenced in this article.”
Authors: “smikler”
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 748
CppName: “FI_REG_WORD_HOST_CLICKS_SUM”
Name: “RegWordHostClicksSum”
Ticket: “BUKI-1515”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regwordhost”
Group: “RegWordHost”
Tags: [TG_DYNAMIC, TG_HOST, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “Relative click-through rate of the triple countryId-word-host according to searches in Yandex.”
Authors: “smikler”
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 749
CppName: “FI_REG_WORD_HOST_YABAR_SUM”
Name: “RegWordHostYabarSum”
Ticket: “BUKI-1515”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regwordhost”
Group: “RegWordHost”
Tags: [TG_DYNAMIC, TG_HOST, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “Relative click-through rate of the triple countryId-word-host according to data from popular search engines in the logs of Bar and SimilarGroup.”
Authors: “smikler”
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 750
CppName: “FI_REGEX_MAX_CLICK_PERCENT_YABAR_REG”
Name: “RegexMaxClickPercentYabarReg”
Ticket: “FACTOR-11”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent”
Group: “Regex”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “Percentage of clicks on this URL among all clicks on similar queries, calculated by popular search engine”
Authors: [“smikler”, “kcd”]
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 751
CppName: “FI_YABAR_HOST_SURFTR_DEPTH_NODES_LEAFLN”
Name: “YabarHostSurfTrDpNdLeafLn”
Ticket: “BUKI-1334”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostStatistics”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SURFING_TREE]
Description: “Lobe length Depth Nodes calculated for hosts”
Authors: [“atolstikov”, “smikler”]
Responsibles: [“atolstikov”, “tarum”, “niknik”]
}
Factor {
Index: 752
CppName: “FI_YABAR_HOST_SURFTR_NODES_TIME_GRDISP”
Name: “YabarHostSurfTrNdTmGrDsp”
Ticket: “BUKI-1334”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostStatistics”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SURFING_TREE]
Description: “Angle variance in Nodes Time space calculated for hosts”
Authors: [“atolstikov”, “smikler”]
Responsibles: [“atolstikov”, “tarum”, “niknik”]
}
Factor {
Index: 753
CppName: “FI_YABAR_HOST_SURFTR_NODES_TIME_LEAFLN90”
Name: “YabarHostSurfTrNdTmLeafLn90”
Ticket: “BUKI-1334”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/HostStatistics”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SURFING_TREE]
Description: “0.9-quantile of leaf length in Nodes Time space calculated for hosts”
Authors: [“atolstikov”, “smikler”]
Responsibles: [“atolstikov”, “tarum”, “niknik”]
}
Factor {
Index: 754
CppName: “FI_WORD_HOST_DOWNLOAD_PROBABILITY”
Name: “WordHostDownloadProbability”
Ticket: “FACTOR-44”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regwordhost”
Group: “RegWordHost”
Tags: [TG_DYNAMIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DEPRECATED]
Description: “Average probability of downloading a file from a host after a click, according to the query.”
Authors: [“osenzen”, “smikler”]
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 755
CppName: “FI_NASTY_CONTENT”
Name: “NastyContent”
Ticket: [“FACTOR-113”, “SEARCHSPAM-2435”]
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/NastyContent”
Tags: [TG_STATIC, TG_DOC, TG_THEME_CLASSIF, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Content nasty factor.”
Authors: “melkov”
Responsibles: “alsafr”
}
Factor {
Index: 756
CppName: “FI_URL_SYNNORM_PCTR”
Name: “SynnormURLPCTR”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_SYNNORM, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Ticket: “FACTOR-72”
Wiki: “wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/SynnormFeatures”
Description: “CTR by click data, query normalized by synsets”
Authors: [“rizar”, “ekrokhalev”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 757
CppName: “FI_URL_SYNNORM_PCTR_REG”
Name: “SynnormURLPCTRReg”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_SYNNORM, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Ticket: “FACTOR-72”
Wiki: “wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/SynnormFeatures”
Description: “Regional CTR by click data, query normalized by synsets”
Authors: [“rizar”, “ekrokhalev”]
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 758
CppName: “FI_URL_QUERY_TRIGRAMS_STATIC”
Name: “UrlQueryTrigramsStatic”
Group: “RegDocStatic”
Tags: [TG_LOCALIZED_COUNTRY, TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_UNDOCUMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_URL_QUERY_TRIGRAMS]
Ticket: “FACTOR-24”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/UrlQueryTrigramsStatic”
Description: “Static trigrams intersection of url and queries by which users visited the url.”
Authors: “vvp”
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 759
CppName: “FI_ADV_ASPAM”
Name: “AdvAspam”
Ticket: “BUKI-1757”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/AdvAspam”
Tags: [TG_COMMERCIAL, TG_OWNER, TG_STATIC, TG_UNDOCUMENTED, TG_L2, TG_MASCOT, TG_NN_OVER_FEATURES_USE]
Authors: [“burmisha”, “sisoid”]
Responsibles: “efedina”
}
Factor {
Index: 760
CppName: “FI_HAS_PORNO_QUERY”
Name: “HasPornoQuery”
DependsOn: [{Feature: [“HasPornoQuery”], Slice: “begemot_query_factors”}]
Ticket: “FACTOR-123”
Wiki: “https://jira.yandex-team.ru/browse/FACTOR-123”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “The result of the adult sorcerer’s rule.”
Authors: “zagrebin”
Responsibles: “smikler”
}
Factor {
Index: 761
CppName: “FI_QU_BM15_WEIGHTED”
Name: “QUBm15Weighted”
Group: “Annotation”
Ticket: “FACTOR-21”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QUFactors”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_FILTER, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_MULTI_PERIOD]
Description: “Weighted BM15 for a query by document index – a list of queries that were linked to it.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 762
CppName: “FI_WS_IS_INDEX_PAGE_AND_BOCM”
Name: “WeightedSumIsIndexPageBocm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_TRANS, TG_NN_OVER_FEATURES_USE]
Ticket: “FACTOR-140”
Authors: [“burmisha”, “sisoid”]
Responsibles: “sisoid”
DependsOn: [{Feature: [“IsIndexPage”, “Bocm”]}]
}
Factor {
Index: 763
CppName: “FI_WS_IS_INDEX_PAGE_AND_QUERY_IS_NAV_MX”
Name: “WeightedSumIsIndexPageIsNavMxQuery”
Tags: [TG_DEPRECATED, TG_DYNAMIC, TG_DOC, TG_NAV, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_TRANS, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RU
Ticket: “FACTOR-140”
Authors: [“burmisha”, “sisoid”]
Responsibles: “sisoid”
DependsOn: [{Feature: [“IsIndexPage”, “IsNavMxQuery”]}]
}
Factor {
Index: 764
CppName: “FI_BROWSER_HOST_DOWNLOAD_PROBABILITY”
Name: “BrowserHostDownloadProbability”
Ticket: “FACTOR-44”
Wiki: “https://jira.yandex-team.ru/browse/FACTOR-44”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_DEPRECATED]
Description: “Probability of downloading a file from the host after a click (according to Bar’s logs).”
Authors: [“osenzen”, “smikler”]
Responsibles: “smikler”
}
Factor {
Index: 765
CppName: “FI_NHOP_CHAINS_COUNT_FRC”
Name: “NHopChainsCountFrc”
Group: “RegDocStatic”
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RELEV
Ticket: “FACTOR-97”
Wiki: “wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopStatic”
Description: “Number of chains per query / (number of chains the url participated in + number of chains per query).”
Authors: “vvp”
Responsibles: [“alsafr”, “kartynnik”, “tarum”, “niknik”]
}
Factor {
Index: 766
CppName: “FI_NHOP_IS_FINAL”
Name: “NHopIsFinal”
Group: “RegDocStatic”
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RELEV
Ticket: “FACTOR-97”
Wiki: “wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopStatic”
Description: “The number of chains in which the url was last, normalized by the total number of chains in which this url occurred.”
Authors: “vvp”
Responsibles: [“alsafr”, “kartynnik”, “tarum”, “niknik”]
}
Factor {
Index: 767
CppName: “FI_VISITS_FROM_WIKI”
Name: “VisitsFromWiki”
Group: “RegDocStatic”
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_WIKIPEDIA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE]
Countries: CNT_RELEV
Ticket: “FACTOR-46”
Wiki: “wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/VisitsFromWiki”
Description: “Number of clicks to URL from Wikipedia”
Authors: [“bogomolov”, “smikler”]
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 768
CppName: “FI_RC_SEARCH_BASE_URL_CONTRAST_D30ODD0_9_X_D30T1_FROZEN”
Name: “RcSearchBaseUrlContrastD30Odd0_9_X_D30T1Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DATA_FROM_BIGRT, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: “URL feature computed from rapid clicks search frozen counters with decay of 30 days”
Ticket: “USERFEAT-1503”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-10-04”
}
Factor {
Index: 769
CppName: “FI_REG_BROWSER_USER_HUB”
Name: “RegBrowserUserHub”
Ticket: “FACTOR-120”
Wiki: “https://jira.yandex-team.ru/browse/FACTOR-120”
Tags: [TG_STATIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERF]
Countries: CNT_RELEV
Group: “RegDocStatic”
Description: “Indicator of the page as a hub (how many pages Bar users go to from it).”
Authors: [“vvp”, “smikler”]
Responsibles: [“smikler”, “tarum”, “niknik”]
}
Factor {
Index: 770
CppName: “FI_AUX_TITLE_BM25”
Name: “AuxTitleBM25”
Ticket: “FACTOR-160”
Group: “AuxBM25”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_REARR_USE, TG_UNDOCUMENTED, TG_L2, TG_DEPRECATED]
Description: “TextBM25 computed over the title using the name of the user’s region as the text – similar to factor 268.”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 771
CppName: “FI_BCLMF”
Name: “Bclmf”
Group: “Annotation”
Ticket: “FACTOR-149”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/QUFactors”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_DOC_TEXT, TG_LINK_TEXT, TG_ANNOTATION_FILTER, TG_DEPRECATED]
Description: “BCLM for Annotation index, doc text and links.”
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 772
CppName: “FI_NO_PRODUCTS_PROBABILITY”
Name: “NoProductsProbability”
Ticket: “COMMERCIAL-64”
Authors: [“hygge”, “alejes”, “kpolitay”]
Responsibles: [“hygge”, “alejes”]
Description: “Dssm prediction of the probability by url + title that there are no products on the page.”
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_NN_OVER_FEATURES_USE]
ImplementationTime: “2020-10-04”
}
Factor {
Index: 773
CppName: “FI_PSE_FRC_BROWSER”
Name: “PopularSEFRCBrowser”
Ticket: “FACTOR-193”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/PopularSEFRC”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DOPP, TG_UNDOCUMENTED, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_POPULAR_SE_FRC, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “FRC of the popular browser log search engine”
Authors: [“vvp”, “zagrebin”, “bogomolov”]
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 774
CppName: “FI_LOG_CTR_MEAN”
Name: “LogCtrMean”
Ticket: “FACTOR-182”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/LogCtrMean”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_CLICKS_SHOWS, TG_FORMULA_2245_DEP_3]
Description: “Weighted mean of log(query_clicks)/log(query_shows) for given host. Weights are proportional to log(query_shows) + 0.2.”
Authors: “tsimkha”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 775
CppName: “FI_QUERY_URL_NHOP_TOTAL_FRC”
Name: “QueryUrlNhopTotalFrc”
Ticket: “FACTOR-145”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopQueryUrl”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_NHOP, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “The number of clicks per request to the url occurring in hop chains, normalized by the total number of clicks on the request.”
Authors: “vvp”
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 776
CppName: “FI_QUERY_URL_NHOP_IS_FINAL”
Name: “QueryUrlNhopIsFinal”
Ticket: “FACTOR-145”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopQueryUrl”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_BROWSER, TG_USER_EXT_DATA, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_NHOP, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Probability of the url to be the last query in the hop chain.”
Authors: “vvp”
Responsibles: [“alsafr”, “tarum”, “niknik”]
}
Factor {
Index: 777
CppName: “FI_ONE_PRODUCT_PROBABILITY”
Name: “OneProductProbability”
Ticket: “COMMERCIAL-64”
Authors: [“hygge”, “alejes”, “kpolitay”]
Responsibles: [“hygge”, “alejes”]
Description: “Dssm probability prediction by url + title that there is only one product on the page.”
Tags: [TG_L2, TG_NEURAL, TG_STATIC, TG_URL_TEXT, TG_NN_OVER_FEATURES_USE]
ImplementationTime: “2020-10-04”
}
Factor {
Index: 778
CppName: “FI_MANY_PRODUCTS_PROBABILITY”
Name: “ManyProductsProbability”
Ticket: “COMMERCIAL-64”
Authors: [“hygge”, “alejes”, “kpolitay”]
Responsibles: [“hygge”, “alejes”]
Description: “Dssm prediction of the probability by url + title that there are a lot of products on the page.”
Tags: [TG_L2, TG_NEURAL, TG_STATIC, TG_URL_TEXT, TG_NN_OVER_FEATURES_USE]
ImplementationTime: “2020-10-04”
}
Factor {
Index: 779
CppName: “FI_RC_SEARCH_BASE_URL_RATIONAL_SIGMOID_D3T120_FROZEN”
Name: “RcSearchBaseUrlRationalSigmoidD3T120Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SEARCH_RAPID_CLICKS_BIGRT, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNUSED]
Description: “URL feature computed from rapid clicks search frozen counters with decay of 3 days”
Ticket: “USERFEAT-1503”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
ImplementationTime: “2020-10-04”
}
Factor {
Index: 780
CppName: “FI_GEO_CITY_URL_HAS_CITY”
Name: “GeoCityUrlHasCity”
Ticket: “BUKI-1125”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_URL_TEXT, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: “City level georeference defined for url according to BUKI-1125 rules”
Authors: “denplusplus”
Responsibles: “esoloviev”
}
Factor {
Index: 781
CppName: “FI_GEO_CITY_URL_HAS_COUNTRY”
Name: “GeoCityUrlHasCountry”
Ticket: “BUKI-1125”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/GeoCityUrl”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_URL_TEXT, TG_BINARY, TG_DEPRECATED, TG_OFTEN_ZERO, TG_L2]
Description: “Url has country-level georeference defined according to BUKI-1125 rules”
Authors: “denplusplus”
Responsibles: “esoloviev”
}
Factor {
Index: 782
CppName: “FI_GEO_RELEV_REGION_CITY_GEOA”
Name: “GeoRelevRegionCityGeoa”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “GeoRelevRegionCity factor by geoa attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 783
CppName: “FI_GEO_RELEV_REGION_REGION_GEOA”
Name: “GeoRelevRegionRegionGeoa”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_REGION, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “GeoRelevRegionRegion factor by geoa attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 784
CppName: “FI_GEO_GEOMETRY_PROXIM_GEOA”
Name: “GeoGeometryProximGeoa”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “GeoGeometryProxim factor by geoa attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 785
CppName: “FI_GEO_RELEV_ALIEN_CITY_GEOA”
Name: “GeoRelevAlienCityGeoa”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “GeoRelevAlienCity factor by geoa attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 786
CppName: “FI_GEO_V_QUERY_IN_USERS_CITY_GEOA”
Name: “GeoVQueryInUserCityGeoa”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “GeoVQueryInUserCity factor by geoa attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 787
CppName: “FI_GEO_V_QUERY_IN_ALIEN_CITY_GEOA”
Name: “GeoVQueryInAlienCityGeoa”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “GeoVQueryInAlienCity factor by geoa attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 788
CppName: “FI_PAGE_REGION_SIZE_GEO”
Name: “PageRegionSizeGeo”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “PageRegionSize factor by geo attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 789
CppName: “FI_PAGE_REGION_COVERAGE_GEO”
Name: “PageRegionCoverageGeo”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “PageRegionCoverage factor by geo attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 790
CppName: “FI_PAGE_REGION_COVERAGE_ADRESA”
Name: “PageRegionCoverageAddress”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_STATIC, TG_STATIC_REGINFO, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “PageRegionCoverage factor by adresa attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 791
CppName: “FI_GEO_RELEV_REGION_CITY_ADRESA”
Name: “GeoRelevRegionCityAddress”
Ticket: “QREG-41”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_BINARY, TG_UNDOCUMENTED, TG_OFTEN_ZERO, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “GeoRelevRegionCity factor by adresa attribute”
Authors: “esoloviev”
Responsibles: “esoloviev”
}
Factor {
Index: 792
CppName: “FI_DOPP_URL_SESSION_CLICKS_FRC”
Name: “DoppQueryUrlSessionClicksFRC”
Ticket: “FACTOR-127”
Wiki: “http://wiki.yandex-team.ru/JandeksPoisk/KachestvoPoiska/ObshayaFormula/TekushhieKomponenty/DoppQueryUrlSessionClicksFRC”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_DOPP, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “What percentage (on average per session) of URLs clicked on this query is this url. Calculated by user sessions.”
Authors: “alsafr”
Responsibles: [“kolesov93”, “alsafr”]
}
Factor {
Index: 793
CppName: “FI_OWNER_IS_ACTUAL_SHOP”
Name: “OwnerIsActualShop”
Tags: [TG_OWNER, TG_STATIC, TG_L2, TG_COMMERCIAL]
Description: “Owner is a store”
Ticket: “COMMERCIAL-62”
Authors: [“miha715lev”, “alejes”]
Responsibles: [“miha715lev”, “alejes”]
ImplementationTime: “2020-09-30”
}
Factor {
Index: 794
CppName: “FI_OWNER_IS_SERVICE”
Name: “OwnerIsService”
Tags: [TG_OWNER, TG_STATIC, TG_L2, TG_COMMERCIAL, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “Owner is a service”
Ticket: “COMMERCIAL-62”
Authors: [“miha715lev”, “alejes”]
Responsibles: [“miha715lev”, “alejes”]
}
Factor {
Index: 795
CppName: “FI_NHOP_TEXT_BCLM_PLANE”
Name: “NHopTextBclmPlane”
Group: “Annotation”
Ticket: “FACTOR-108”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/NHopText”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_LOCALIZED_COUNTRY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_238D, TG_USERFEAT_NHOP]
Countries: CNT_RELEV
Description: “Bclm (plane) based on texts from hops.”
Authors: “vvp”
Responsibles: “alsafr”
}
Factor {
Index: 796
CppName: “FI_SAME_QUERY_FRC_BROWSER”
Name: “SameQueryReturnFRCBrowser”
Ticket: “FACTOR-234”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/samequeryreturn”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_DOPP, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_238D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SAME_QUERY_RETURN, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “FRC on referrals from queries that were issued by the user several times”
Authors: [“bogomolov”, “vvp”]
Responsibles: [“smikler”, “tarum”, “niknik”]
}
Factor {
Index: 797
CppName: “FI_QUERY_URL_ISBM_CTR”
Name: “QueryURLISBMCTR”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/isbm”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SBM, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Countries: CNT_RELEV
Ticket: “FACTOR-65”
Description: “Average weight of impressions on the first page; clicks weight 1, non-clicks – according to the SBM_GAMMAS table”
Authors: [“shpilman”, “dprpavlin”]
Responsibles: [“dprpavlin”, “tarum”, “niknik”]
}
Factor {
Index: 798
CppName: “FI_QUERY_URL_ISBM_CTR_REG”
Name: “QueryURLISBMCTRReg”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/isbm”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_SBM, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Ticket: “FACTOR-65”
Description: “Average weight of impressions on the first page; clicks weight 1, non-clicks – according to the SBM_GAMMAS table. Regional version”
Authors: [“shpilman”, “dprpavlin”]
Responsibles: [“dprpavlin”, “tarum”, “niknik”]
}
Factor {
Index: 799
CppName: “FI_REGEX_BEAST_POSITION_REG”
Name: “RegexBeastPositionReg”
Ticket: “FACTOR-268”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexbeastpositionreg”
Group: “Regex”
Tags: [TG_DOC, TG_DYNAMIC, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_BEAST, TG_LOCALIZED_COUNTRY, TG_L2, TG_DEPRECATED]
Countries: CNT_TR
Description: “Half the sum of the url position score with the median position for all similar queries, according to Beast”
Authors: [“avatar”, “vvp”]
Responsibles: [“avatar”, “smikler”, “tsimkha”]
}
Factor {
Index: 800
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D3T0_AT_REQ”
Name: “RcSpylogHostRationalSigmoidD3T0AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed at the request time from rapid clicks spy_log counters with decay of 3 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 801
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D3T0DTM3600_AT_REQ”
Name: “RcSpylogHostRationalSigmoidD3DTM3600AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed at the request time from rapid clicks spy_log counters with decay of 3 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 802
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D14T0_AT_REQ”
Name: “RcSpylogHostRationalSigmoidD14T0AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed at the request time from rapid clicks spy_log counters with decay of 14 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 803
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D14DTM3600_AT_REQ”
Name: “RcSpylogHostRationalSigmoidD14DTM3600AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed at the request time from rapid clicks spy_log counters with decay of 14 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 804
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOIDED_CTRD3DT0TM3600_AT_REQ”
Name: “RcSpylogHostRationalSigmoidedCTRD3DT0TM3600AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed at the request time from rapid clicks spy_log counters with decay of 3 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 805
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOIDED_CTRD14DT0TM3600_AT_REQ”
Name: “RcSpylogHostRationalSigmoidedCTRD14DT0TM3600AtReq”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed at the request time from rapid clicks spy_log counters with decay of 14 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 806
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D3T0_FROZEN”
Name: “RcSpylogHostRationalSigmoidD3T0Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed from rapid clicks spy_log counters with decay of 3 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 807
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D3T0DTM3600_FROZEN”
Name: “RcSpylogHostRationalSigmoidD3DTM3600Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed from rapid clicks spy_log counters with decay of 3 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 808
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D14T0_FROZEN”
Name: “RcSpylogHostRationalSigmoidD14T0Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed from rapid clicks spy_log counters with decay of 14 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 809
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOID_D14DTM3600_FROZEN”
Name: “RcSpylogHostRationalSigmoidD14DTM3600Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed from rapid clicks spy_log counters with decay of 14 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 810
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOIDED_CTRD3DT0TM3600_FROZEN”
Name: “RcSpylogHostRationalSigmoidedCTRD3DT0TM3600Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed from rapid clicks spy_log counters with decay of 3 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 811
CppName: “FI_RC_SPYLOG_HOST_RATIONAL_SIGMOIDED_CTRD14DT0TM3600_FROZEN”
Name: “RcSpylogHostRationalSigmoidedCTRD14DT0TM3600Frozen”
Group: “Rapid Clicks”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_L2, TG_DATA_FROM_BIGRT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_UNUSED]
Description: “Host feature computed from rapid clicks spy_log counters with decay of 14 days”
Ticket: “USERFEAT-1508”
Authors: [“skorodumov-s”]
Responsibles: [“skorodumov-s”, “tarum”]
}
Factor {
Index: 812
CppName: “FI_COMMERCIAL_DSSM_ODD_LIKE”
Name: “CommercialDssmOddLike”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_DOC_TEXT, TG_URL_TEXT, TG_NEURAL, TG_COMMERCIAL, TG_RTMODELS_SERVICE, TG_NN_OVER_FEATURES_USE]
Description: “Finetuned reformulations DSSM to commercial clicked bargain odd-like target from visit log”
Ticket: “FORMULA-2001”
Authors: [“alexumnov”]
Responsibles: [“alexumnov”]
ImplementationTime: “2020-11-12”
}
Factor {
Index: 813
CppName: “FI_DISTRIBUTOR_HOSTS”
Name: “DistributorHosts”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNIMPLEMENTED, TG_BINARY, TG_UNUSED]
Description: “Is legal video distributor”
Ticket: “SEARCHSPAM-15565”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “sdormidontov”]
}
Factor {
Index: 814
CppName: “FI_ONE_PRODUCT_PROBABILITY_AVG”
Name: “OneProductProbabilityAvg”
Ticket: “SEARCHSPAM-15568”
Authors: [“ulyan”]
Responsibles: [“ulyanov”, “bikulov”]
Description: “Average value of feature OneProductProbability”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 815
CppName: “FI_MANY_PRODUCTS_PROBABILITY_AVG”
Name: “ManyProductsProbabilityAvg”
Ticket: “SEARCHSPAM-15568”
Authors: [“ulyan”]
Responsibles: [“ulyanov”, “bikulov”]
Description: “Average value of feature ManyProductsProbability”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 816
CppName: “FI_PAY_DETECTOR_PREDICT_AVG”
Name: “PayDetectorPredictAvg”
Ticket: “SEARCHSPAM-15568”
Authors: [“ulyan”]
Responsibles: [“ulyanov”, “bikulov”]
Description: “Average value of feature PayDetectorPredict”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 817
CppName: “FI_OWNER_IS_PARTNER”
Name: “OwnerIsPartner”
Tags: [TG_OWNER, TG_STATIC, TG_L2, TG_COMMERCIAL, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “Owner is a partner”
Ticket: “COMMERCIAL-90”
Authors: [“miha715lev”, “alejes”]
Responsibles: [“miha715lev”, “alejes”]
}
Factor {
Index: 818
CppName: “FI_SHOP_IN_SHOP_URL”
Name: “ShopInShopUrl”
Tags: [TG_DOC, TG_STATIC, TG_L2, TG_OFTEN_ZERO, TG_COMMERCIAL, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “Document is ShopInShop”
Ticket: “COMMERCIAL-135”
Authors: [“miha715lev”, “alejes”]
Responsibles: [“miha715lev”, “alejes”]
}
Factor {
Index: 819
CppName: “FI_QUERY_CONVERSION_DETECTOR_PREDICT”
Name: “QueryConversionDetectorPredict”
Ticket: “COMMERCIAL-81”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED]
Description: “The value of the query conversion rate calculated in Begemot.”
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
MaxValue: 25.0
MinValue: -25.0
ImplementationTime: “2020-12-01”
}
Factor {
Index: 820
CppName: “FI_FIO_FROM_ORIGINAL_REQUEST_BODY_CHAIN0_WCM”
Name: “FioFromOriginalRequestBodyChain0Wcm”
Ticket: “SEARCHSPEC-94”
Description: “Factor by full name from the original request. Computed over the content of the document. Algorithm: Chain0Wcm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 821
CppName: “FI_PRODUCT_OFFER_ANY_AVAILABLE”
Name: “ProductOfferAnyAvailable”
Ticket: “COMMERCIAL-78”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “At least one offer from the parsed schema has an availability status.”
Tags: [TG_L2, TG_STATIC, TG_OFTEN_ZERO]
ImplementationTime: “2020-04-07”
}
Factor {
Index: 822
CppName: “FI_PRODUCT_OFFER_NO_PRODUCTS”
Name: “ProductOfferNoProducts”
Ticket: “COMMERCIAL-78”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “There are no offers in the parsed scheme.”
Tags: [TG_L2, TG_STATIC]
ImplementationTime: “2020-04-07”
}
Factor {
Index: 823
CppName: “FI_BAD_YTIER_URL”
Name: “BadYtierUrl”
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_UNIMPLEMENTED, TG_OFTEN_ZERO, TG_USER_SEARCH, TG_META, TG_L3, TG_PRS]
Authors: “hommforever”
Responsibles: [“hommforever”]
Ticket: “SEARCHSPEC-25”
Wiki: “”
DependsOn: []
Description: “The url from ytier is known to have low quality content”
}
Factor {
Index: 824
CppName: “FI_NORM_YTIER_URL”
Name: “NormYtierUrl”
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_UNIMPLEMENTED, TG_OFTEN_ZERO, TG_USER_SEARCH, TG_META, TG_L3, TG_PRS]
Authors: “hommforever”
Responsibles: [“hommforever”]
Ticket: “SEARCHSPEC-25”
Wiki: “”
DependsOn: []
Description: “The url from ytier is known to have acceptable quality content”
}
Factor {
Index: 825
CppName: “FI_GOOD_YTIER_URL”
Name: “GoodYtierUrl”
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_UNIMPLEMENTED, TG_OFTEN_ZERO, TG_USER_SEARCH, TG_META, TG_L3, TG_PRS]
Authors: “hommforever”
Responsibles: [“hommforever”]
Ticket: “SEARCHSPEC-25”
Wiki: “”
DependsOn: []
Description: “The url from ytier is known to have good quality content”
}
Factor {
Index: 826
CppName: “FI_BEST_YTIER_URL”
Name: “BestYtierUrl”
Tags: [TG_STATIC, TG_DOC, TG_UNUSED, TG_UNIMPLEMENTED, TG_OFTEN_ZERO, TG_USER_SEARCH, TG_META, TG_L3, TG_PRS]
Authors: “hommforever”
Responsibles: [“hommforever”]
Ticket: “SEARCHSPEC-25”
Wiki: “”
DependsOn: []
Description: “The url from ytier is known to have great quality content”
}
Factor {
Index: 827
CppName: “FI_HOST_IS_ECOM_PURCHASE”
Name: “HostIsEcomPurchase”
Ticket: “COMMERCIAL-124”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “The host has an ECOM purchase.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 828
CppName: “FI_HOST_IS_VISIT_LOGS_PURCHASE”
Name: “HostIsVisitLogsPurchase”
Ticket: “COMMERCIAL-124”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “There is a VISIT LOG purchase on the host.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 829
CppName: “FI_YANDEX_MARKET_PRODUCT_URL”
Name: “YandexMarketProductUrl”
Tags: [TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “URL is a product on Market.”
Ticket: “COMMERCIAL-128”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
# ImplementationTime: “2020-12-04”
}
Factor {
Index: 830
CppName: “FI_YANDEX_MARKET_PRODUCT_INCLUDE_OFFERID_URL”
Name: “YandexMarketProductIncludeOfferidUrl”
Tags: [TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “The URL is a product on the Market and has an offerid.”
Ticket: “COMMERCIAL-128”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
# ImplementationTime: “2020-12-04”
}
Factor {
Index: 831
CppName: “FI_SHOP_IN_SHOP_CPA_URL”
Name: “ShopInShopCPAUrl”
Tags: [TG_DYNAMIC, TG_DOC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “URL is ShopInShopCPA.”
Ticket: “COMMERCIAL-183”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
# ImplementationTime: “2020-03-18”
}
Factor {
Index: 832
CppName: “FI_PRODUCT_OFFER_NOT_AVAILABLE”
Name: “ProductOfferNotAvailable”
Ticket: “COMMERCIAL-78”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “At least one offer from the parsed schema has an unavailable status.”
Tags: [TG_L2, TG_STATIC, TG_OFTEN_ZERO]
ImplementationTime: “2020-04-07”
}
Factor {
Index: 833
CppName: “FI_OWNER_IS_ECOM_PURCHASE”
Name: “OwnerIsEcomPurchase”
Ticket: “COMMERCIAL-124”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “The owner has an ECOM purchase.”
Tags: [TG_OWNER, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED]
ImplementationTime: “2020-12-17”
}
Factor {
Index: 834
CppName: “FI_OWNER_IS_VISIT_LOGS_PURCHASE”
Name: “OwnerIsVisitLogsPurchase”
Ticket: “COMMERCIAL-124”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “The owner has a VISIT LOG purchase.”
Tags: [TG_HOST, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 835
CppName: “FI_NAV_PARASITES”
Name: “NavParasites”
Ticket: “FACTOR-2471”
Authors: [“hygge”, “alejes”, “polandr”]
Responsibles: [“hygge”, “alejes”]
Description: “Dssm predicts the probability by url + title that the document is a freeloader.”
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_NOT_01, TG_UNUSED, TG_ALLOW_USE_FOR_SPAM_FORMULAS]
ImplementationTime: “2022-01-01”
MinValue: -0.5
MaxValue: 1.5
}
Factor {
Index: 836
CppName: “FI_OFFER_AVAILABILITY_IS_SET_UP”
Name: “OfferAvailabilityIsSetUp”
Ticket: “COMMERCIAL-186”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “The PartnerOfferContent available field is set in the offer from the new parser.”
Tags: [TG_L2, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 837
CppName: “FI_OFFER_AVAILABILITY”
Name: “OfferAvailability”
Ticket: “COMMERCIAL-186”
Authors: [“hygge”, “alejes”]
Responsibles: [“hygge”, “alejes”]
Description: “In the offer from the new parser, the field PartnerOfferContent available == true.”
Tags: [TG_L2, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 838
CppName: “FI_URL_CLICKS_MAX_GEO_CITY_FRC_WEIGHT”
Name: “URLClicksMaxGeoCityFRCWeight”
Ticket: “FACTOR-36”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/URLClicksMaxGeoCityFRC”
Tags: [TG_DOC, TG_STATIC, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_GEOCLICKS]
Description: “Normalized corrected clicks count by query with user’s city(gc=) mentioned”
Authors: “esoloviev”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 839
CppName: “FI_URL_CLICKS_MAX_GEO_CITY_FRC_RATIO”
Name: “URLClicksMaxGeoCityFRCRatio”
Ticket: “FACTOR-36”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/URLClicksMaxGeoCityFRC”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_GEOCLICKS]
Description: “Normalized corrected clicks maximum ratio by query with user’s city(gc=) mentioned”
Authors: “esoloviev”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 840
CppName: “FI_URL_CLICKS_MAX_ALIEN_GEO_CITY_FRC_RATIO”
Name: “URLClicksMaxGeoAlienCityFRCRatio”
Ticket: “FACTOR-36”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/URLClicksMaxGeoCityFRC”
Tags: [TG_DOC, TG_DYNAMIC, TG_LOCALIZED_CITY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_GEOCLICKS]
Description: “Normalized corrected clicks maximum ratio by query with not user’s city(gc=) mentioned”
Authors: “esoloviev”
Responsibles: [“tarum”, “niknik”]
}
Factor {
Index: 841
CppName: “FI_FAST_MX”
Name: “FastMx”
Ticket: “FACTOR-271”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/FastMx”
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Authors: [“vmordovin”, “sisoid”]
Responsibles: [“vmordovin”, “sisoid”]
}
Factor {
Index: 842
CppName: “FI_PURCHASE_TOTAL_PREDICT”
Name: “PurchaseTotalPredict”
Ticket: “COMMERCIAL-190”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “The PurchaseTotalPredict value calculated in Behemoth.”
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
MinValue: -10
MaxValue: 10
}
Factor {
Index: 843
CppName: “FI_SERP_SUMMARY_SURPLUS_PREDICT”
Name: “SerpSummarySurplusPredict”
Ticket: “COMMERCIAL-190”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “The SerpSummarySurplusPredict value calculated in the behemoth.”
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
}
Factor {
Index: 844
CppName: “FI_YABAR_URL_REVISITS”
Name: “YabarUrlRevisits”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/Revisits”
Ticket: “FACTOR-186”
Tags: [TG_STATIC, TG_DOC, TG_USER, TG_BROWSER, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_90D, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_REVISITS]
Description: “Returning user to url”
Authors: [“shpilman”, “atolstikov”]
Responsibles: [“atolstikov”, “tarum”, “niknik”]
}
Factor {
Index: 845
CppName: “FI_REQUEST_WITH_120_D3_CLICK_PART_PREDICT”
Name: “RequestWith120D3ClickPartPredict”
Ticket: “COMMERCIAL-190”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_NOT_01, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “The value of RequestWith120D3ClickPartPredict calculated in the behemoth.”
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
MinValue: -10
MaxValue: 110
}
Factor {
Index: 846
CppName: “FI_QUERY_NAV_PARASITES_DETECTOR_PREDICT”
Name: “QueryNavParasitesDetectorPredict”
Ticket: “COMMERCIAL-190”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_UNUSED]
Description: “The value of the Freeloader Query Detector calculated in Behemoth.”
Authors: [“alejes”, “hygge”, “i-vainn”]
Responsibles: [“alejes”, “hygge”]
ImplementationTime: “2022-01-01”
}
Factor {
Index: 847
CppName: “FI_BROWSER_HOST_CNT_DWELL_TIME_LOG”
Name: “BrowserHostCntDwellTimeLog”
Group: “RegHostStatic”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/YabarUrlVisitsRegions”
Ticket: “FACTOR-324”
Tags: [TG_STATIC, TG_USER, TG_HOST, TG_BROWSER, TG_LOCALIZED_COUNTRY, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_REG_SITE_BROWSER]
Countries: CNT_RELEV
Description: “Logarithm of the average time spent by a user on a host with localization by country; calculated from Yabar logs”
Authors: [“gotmanov”, “vvp”, “esoloviev”]
Responsibles: [“gotmanov”, “alsafr”]
}
Factor {
Index: 848
CppName: “FI_BROWSER_HOST_DWELL_TIME_REGION_FRC”
Name: “BrowserHostDwellTimeRegionFrc”
Group: “RegHostStatic”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/YabarUrlVisitsRegions”
Ticket: “FACTOR-324”
Tags: [TG_STATIC, TG_USER, TG_HOST, TG_BROWSER, TG_LOCALIZED_REGION, TG_L2, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_REG_SITE_BROWSER]
Description: “The ratio of dwell time on a host in this region to dwell time on a host across all regions”
Authors: [“gotmanov”, “vvp”, “esoloviev”]
Responsibles: [“gotmanov”]
}
Factor {
Index: 849
CppName: “FI_BROWSER_URL_DWELL_TIME_REGION_FRC”
Name: “BrowserUrlDwellTimeRegionFrc”
Group: “RegDocStatic”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/YabarUrlVisitsRegions”
Ticket: “FACTOR-324”
Tags: [TG_STATIC, TG_USER, TG_DOC, TG_BROWSER, TG_LOCALIZED_REGION, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_90D, TG_USERFEAT_REG_SITE_BROWSER]
Description: “The ratio of dwell time on a page in this region to dwell time on a page for all regions”
Authors: [“gotmanov”, “vvp”, “esoloviev”]
Responsibles: [“gotmanov”]
}
Factor {
Index: 850
CppName: “FI_BROWSER_BOOKMARKS_URL”
Name: “BrowserBookmarksUrl”
Ticket: “FACTOR-310”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/BrowserBookmarks”
Tags: [TG_STATIC, TG_USER, TG_BROWSER, TG_DOC, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_NN_OVER_FEATURES_USE]
Description: “The more users bookmark a URL, the higher the factor value”
Authors: [“pavelgur”, “vvp”]
Responsibles: [“pavelgur”, “tarum”, “niknik”]
}
Factor {
Index: 851
CppName: “FI_SOS_DSSM”
Name: “SosDssm”
Ticket: “FACTOR-2475”
Authors: [“hygge”, “alejes”, “anrodigina”, “hommforever”]
Responsibles: [“hygge”, “alejes”]
Description: “Predict sos.dssm model by url + title.”
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_NOT_01, TG_USED_IN_CONF_REARR]
MinValue: -1
MaxValue: 1
ImplementationTime: “2021-03-31”
}
Factor {
Index: 852
CppName: “FI_MED_DSSM”
Name: “MedDssm”
Ticket: “FACTOR-2475”
Authors: [“hygge”, “alejes”, “anrodigina”, “hommforever”]
Responsibles: [“hygge”, “alejes”]
Description: “Predict med.dssm model by url + title.”
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_NOT_01, TG_USED_IN_CONF_REARR]
MinValue: -10
MaxValue: 10
ImplementationTime: “2021-03-31”
}
Factor {
Index: 853
CppName: “FI_FIN_LAW_DSSM”
Name: “FinLawDssm”
Ticket: “FACTOR-2475”
Authors: [“hygge”, “alejes”, “anrodigina”, “hommforever”]
Responsibles: [“hygge”, “alejes”]
Description: “Predict fin_law.dssm model by url + title.”
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_UNUSED, TG_UNIMPLEMENTED]
}
Factor {
Index: 854
CppName: “FI_WIKI_INFOBOX”
Name: “WikiInfobox”
Ticket: “FACTOR-85”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/WikiInfobox”
Tags: [TG_STATIC, TG_DOC, TG_WIKIPEDIA, TG_USER, TG_LINK_GRAPH, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_1D, TG_NN_OVER_FEATURES_USE]
Description: “This URL is linked from Infoboxes on Wikipedia.”
Authors: [“dimavin”, “smikler”]
Responsibles: [“dimavin”, “smikler”, “tarum”, “niknik”]
}
Factor {
Index: 855
CppName: “FI_CRUELTY_DSSM”
Name: “CrueltyDssm”
Ticket: “FACTOR-2476”
Authors: [“hygge”, “alejes”, “anrodigina”, “hommforever”]
Responsibles: [“hygge”, “alejes”]
Description: “Predict cruelty.dssm model by url + title.”
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_UNUSED, TG_USED_IN_CONF_REARR, TG_NOT_01]
MinValue: -10
MaxValue: 10
}
Factor {
Index: 856
CppName: “FI_HALF_ECOM_PREDICT”
Name: “HalfEcomPredict”
Ticket: “COMMERCIAL-190”
Tags: [TG_DYNAMIC, TG_QUERY_ONLY, TG_USER, TG_L2, TG_QUERY_DETECTOR_PREDICT, TG_UNUSED, TG_UNIMPLEMENTED]
Description: “The HalfEcomPredict value calculated in Behemoth.”
Authors: [“alejes”, “hygge”]
Responsibles: [“alejes”, “hygge”]
}
Factor {
Index: 857
CppName: “FI_PREFIX_SUFFIX_MAX_CLICK_PERCENT_REG”
Name: “PrefixSuffixMaxClickPercentReg”
Ticket: “FACTOR-396”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent”
Group: “Regex”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “A factor similar to RegexMaxClickPercentReg, but calculated from the prefix-suffix generalization.”
Authors: [“smikler”]
Responsibles: [“smikler”, “tsimkha”, “yustuken”]
}
Factor {
Index: 858
CppName: “FI_PREFIX_SUFFIX_MAX_CLICK_PERCENT_YABAR_REG”
Name: “PrefixSuffixMaxClickPercentYabarReg”
Ticket: “FACTOR-396”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/regexmaxclickpercent”
Group: “Regex”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Countries: CNT_RELEV
Description: “A factor similar to RegexMaxClickPercentYabarReg, but calculated from the prefix-suffix generalization.”
Authors: [“smikler”]
Responsibles: [“smikler”, “tsimkha”, “yustuken”]
}
Factor {
Index: 859
CppName: “FI_DSSM_NAVIGATION_L2”
Name: “DssmNavigationL2”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_NEURAL, TG_L2]
Description: “Request-document navigation model.”
UseArtifact: {Name: “DssmNavigationL2”}
Ticket: “SEARCH-10934”
Authors: [“hygge”, “alejes”, “arrin”]
Responsibles: [“hygge”, “alejes”]
ImplementationTime: “2021-03-31”
}
Factor {
Index: 860
CppName: “FI_YABAR_HOST_SURFTR_NODES_HANGS_GRADIENT”
Name: “YabarHostSurfTrNdHgGr”
Ticket: “FACTOR-112”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/SurfTr-Hangs”
Tags: [TG_STATIC, TG_HOST, TG_USER, TG_BROWSER, TG_USER_SEARCH, TG_L2, TG_DEPRECATED]
Description: “Average slope (gradient) in the nodes-hangs plane”
Authors: [“atolstikov”, “osenzen”]
Responsibles: “atolstikov”
}
Factor {
Index: 861
CppName: “FI_QUERY_URL_CORRECTED_CTR_XFACTOR”
Name: “QueryUrlCorrectedCtrXfactor”
Ticket: “FACTOR-397”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryUrlCorrectedCtrXfactor”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_COLLABORATED, TG_USER, TG_L2, TG_DEPRECATED, TG_REMOVED]
Countries: [CNT_ALL, CNT_TR]
Description: “Url query factor. Value is the result of collaborative data filtering for the QueryUrlCorrectedCtr factor”
Authors: [“avatar”, “vvp”, “alsafr”]
Responsibles: [“avatar”, “alsafr”]
}
Factor {
Index: 862
CppName: “FI_FULL_MATRIX_NET”
Name: “FullMatrixNet”
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: “SAASSUP-3320”
Authors: [“derrior”]
Responsibles: [“derrior”]
Description: “MatrixNet Slow Ranking Model Value.”
}
Factor {
Index: 863
CppName: “FI_FAST_MATRIX_NET”
Name: “FastMatrixNet”
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: “SAASSUP-3320”
Authors: [“derrior”]
Responsibles: [“derrior”]
Description: “MatrixNet fast ranking model value.”
}
Factor {
Index: 864
CppName: “FI_FILTER_MATRIX_NET”
Name: “FilterMatrixNet”
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: “SAASSUP-3320”
Authors: [“derrior”]
Responsibles: [“derrior”]
Description: “The MatrixNet value of the filter model.”
}
Factor {
Index: 865
CppName: “FI_SMALL_WINDOW_ATTENUATION_Q”
Name: “SmallWindowAttenuationQ”
Ticket: “FACTOR-441”
Wiki: “http://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/obshayaformula/tekushhiekomponenty/SmallWindow”
Group: “Combined Abs”
Tags: [TG_DOC, TG_DOC_TEXT, TG_DYNAMIC, TG_DEPRECATED]
Authors: “alsafr”
Responsibles: “alsafr”
}
Factor {
Index: 866
CppName: “FI_QUERY_DOC_TITLE_RANGES_MATCHING_SCORE”
Name: “QueryDocTitleRangesMatchingScore”
Ticket: “FACTOR-353”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/QueryDocTitleRanges”
Tags: [TG_DYNAMIC, TG_DOC, TG_DOC_TEXT, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Factor over the text of the request and the title of the document: evaluates how well numerical ranges with marker words correspond”
Authors: [“gotmanov”, “magaz”]
Responsibles: [“gotmanov”, “magaz”]
}
Factor {
Index: 867
CppName: “FI_FULL_POLYNOM”
Name: “FullPolynom”
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: “SAAS-6009”
Authors: [“derrior”]
Responsibles: [“derrior”]
Description: “The Polynom value of the slow ranking model.”
}
Factor {
Index: 868
CppName: “FI_FAST_POLYNOM”
Name: “FastPolynom”
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: “SAAS-6009”
Authors: [“derrior”]
Responsibles: [“derrior”]
Description: “The Polynom value of the fast ranking model.”
}
Factor {
Index: 869
CppName: “FI_FILTER_POLYNOM”
Name: “FilterPolynom”
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: “SAAS-6009”
Authors: [“derrior”]
Responsibles: [“derrior”]
Description: “The Polynom value of the filtering ranking model.”
}
Factor {
Index: 870
CppName: “FI_IS_TRANSLATED_DOCUMENT”
Name: “IsTranslatedDocument”
Tags: [TG_DOC, TG_STATIC, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: “MT-14803”
Authors: [“bvshuryg”]
Responsibles: [“bvshuryg”]
Description: “Indicator that the document was produced by machine translation”
}
Factor {
Index: 871
CppName: “FI_MED_DSSM_WITH_TRASH”
Name: “MedDssmWithTrash”
Ticket: “SENS-177”
Authors: [“hygge”, “alejes”, “anrodigina”, “hommforever”, “nenashevna”]
Responsibles: [“hygge”, “alejes”]
Description: “Prediction of the med_with_trash.dssm model (medical document model with trash added to the training set) by url + title.”
MinValue: -2.0
MaxValue: 2.0
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_UNUSED, TG_UNIMPLEMENTED, TG_NOT_01]
}
Factor {
Index: 872
CppName: “FI_FIN_LAW_DSSM_WITH_TRASH”
Name: “FinLawDssmWithTrash”
Ticket: “SENS-177”
Authors: [“hygge”, “alejes”, “anrodigina”, “hommforever”, “nenashevna”]
Responsibles: [“hygge”, “alejes”]
Description: “Prediction of the fin_law_with_trash.dssm model (fin-law document model with trash added to the training set) by url + title.”
MinValue: -2.0
MaxValue: 2.0
Tags: [TG_L2, TG_NEURAL, TG_URL_TEXT, TG_STATIC, TG_UNUSED, TG_NOT_01, TG_USED_IN_CONF_REARR]
}
Factor {
Index: 873
CppName: “FI_FIO_FROM_ORIGINAL_REQUEST_BODY_MIN_WINDOW_SIZE”
Name: “FioFromOriginalRequestBodyMinWindowSize”
Ticket: “SEARCHSPEC-94”
Description: “Factor by full name from the original request. Computed over the document content. The minimum size of the window that includes all the words of the request. Normalized by the number of words in the request.”
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_TEXT_MACHINE]
ImplementationTime: “2021-08-30”
}
Factor {
Index: 874
CppName: “FI_FIO_FROM_ORIGINAL_REQUEST_TEXT_COSINE_MATCH_MAX_PREDICTION”
Name: “FioFromOriginalRequestTextCosineMatchMaxPrediction”
Ticket: “SEARCHSPEC-94”
Description: “Factor by full name from the original request. Computed over the document text. Algorithm: CosineMatchMaxPrediction.”
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 875
CppName: “FI_ALL_FIO_FROM_ORIGINAL_REQUEST_ALL_MAX_F_BODY_CHAIN0_WCM”
Name: “AllFioFromOriginalRequestAllMaxFBodyChain0Wcm”
Ticket: “SEARCHSPEC-94”
Description: “Factor by all full names from the original request. Aggregation by all extensions. Aggregation type by extensions: the largest value of the factor. Computed over the document content. Algorithm: Chain0Wcm”
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 876
CppName: “FI_ALL_FIO_FROM_ORIGINAL_REQUEST_ALL_MAX_F_BODY_MIN_WINDOW_SIZE”
Name: “AllFioFromOriginalRequestAllMaxFBodyMinWindowSize”
Ticket: “SEARCHSPEC-94”
Description: “Factor by all full names from the original request. Aggregation by all extensions. Aggregation type by extensions: the largest value of the factor. Computed over the document content. The minimum size of the window that includes all the words of the query. Normalized by the number of words in the query.”
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 877
CppName: “FI_SP_AVG_CLICK_FRC_SYN_REG”
Name: “SamplePeriodClickFrcSyn”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_SYNNORM, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_SAMPLE_PERIOD, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF_SAMPLE_PERIOD, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “Share of URLs in the total number of URLs clicked per session for a query (synnorm).”
Authors: “monnoroch”
Responsibles: [“monnoroch”, “alsafr”, “tarum”, “niknik”]
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod”
Ticket: “FACTOR-442”
}
Factor {
Index: 878
CppName: “FI_SP_AVG_TOTAL_FRC_SYN_REG”
Name: “SamplePeriodDayFrcSyn”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_SYNNORM, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_SAMPLE_PERIOD, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF_SAMPLE_PERIOD, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “The average share of clicks on this URL for this query among all clicks on this query (synnorm) during the day.”
Authors: “monnoroch”
Responsibles: [“monnoroch”, “alsafr”, “tarum”, “niknik”]
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod”
Ticket: “FACTOR-442”
}
Factor {
Index: 879
CppName: “FI_SP_AVG_TOTAL_FRC_REG”
Name: “SamplePeriodDayFrc”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_L2, TG_SAMOHOD_UNIMPLEMENTED, TG_CALLISTO_UNIMPLEMENTED, TG_USERFEAT, TG_USERFEAT_SAMPLE_PERIOD, TG_NN_OVER_FEATURES_USE, TG_USERFEAT_USF_SAMPLE_PERIOD, TG_FORMULA_2245_DEP_3, TG_DEPRECATED]
Description: “The average share of clicks on this URL for this query among all clicks on this query (qnorm) during the day.”
Authors: “monnoroch”
Responsibles: [“monnoroch”, “alsafr”, “tarum”, “niknik”]
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod”
Ticket: “FACTOR-442”
}
Factor {
Index: 880
CppName: “FI_QI_QUERY_URL_CORRECTED_CTR_XFACTOR”
Name: “QiQueryUrlCorrectedCtrXfactor”
Group: “QI”
Ticket: “FACTOR-306”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/qiuserdata”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_USER_EXT_DATA, TG_COLLABORATED, TG_USER, TG_L2, TG_DEPRECATED, TG_REMOVED]
Countries: [CNT_ALL, CNT_TR]
Description: “QI version of factor 861. MaxValue over the set of popular similar queries.”
Authors: “tsimkha”
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 881
CppName: “FI_QI_QUERY_URL_ISBM_CTR_REG”
Name: “QiQueryURLISBMCTRReg”
Group: “QI”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/qiuserdata”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Ticket: “FACTOR-306”
Description: “QI version of factor 798. MaxValue over the set of popular similar queries.”
Authors: “tsimkha”
Responsibles: [“smikler”, “tsimkha”]
}
Factor {
Index: 882
CppName: “FI_ALL_FIO_FROM_ORIGINAL_REQUEST_ALL_MAX_F_TEXT_COSINE_MATCH_MAX_PREDICTION”
Name: “AllFioFromOriginalRequestAllMaxFTextCosineMatchMaxPrediction”
Ticket: “SEARCHSPEC-94”
Description: “Factor by all full names from the original request. Aggregation by all extensions. Aggregation type by extensions: highest factor value; Document text. CosineMatchMaxPrediction algorithm.”
Tags: [TG_DOC, TG_DOC_TEXT, TG_UNDOCUMENTED, TG_UNIMPLEMENTED, TG_TEXT_MACHINE]
}
Factor {
Index: 883
CppName: “FI_DSSM_PAGE_QUALITY”
Name: “DssmPageQuality”
Ticket: “SEARCH-11378, SEARCHSPEC-172”
Authors: [“jullak”]
Responsibles: [“nenashevna”, “hommforever”, “jullak”]
Description: “Dssm predicting the page quality score for a document”
Tags: [TG_DEPRECATED, TG_NEURAL, TG_STATIC, TG_URL_TEXT, TG_DOC]
ImplementationTime: “2021-11-25”
}
Factor {
Index: 884
CppName: “FI_HAS_TURBO_ECOM”
Name: “HasTurboEcom”
Tags: [TG_DOC, TG_STATIC, TG_BINARY, TG_OFTEN_ZERO, TG_META_OVERWRITE, TG_UNUSED, TG_DATA_FROM_SAASKV, TG_UNIMPLEMENTED]
Ticket: “SEARCHSPAM-15910”
Authors: [“bikulov”]
Responsibles: [“bikulov”, “ulyanov”]
}
Factor {
Index: 885
CppName: “FI_MEMORANDUM_URL_TYPE”
Name: “MemorandumUrlType”
Tags: [TG_DOC, TG_STATIC, TG_OFTEN_ZERO, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: “CONTENTQUALITY-169”
Authors: [“makkolts”]
Responsibles: [“makkolts”, “sdormidontov”]
}
Factor {
Index: 886
CppName: “FI_SP_AVG_TOTAL_FRC_XFACTOR_REG”
Name: “SamplePeriodDayFrcXfactor”
Ticket: “FACTOR-506”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiodXfactor”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_LOCALIZED_COUNTRY, TG_COLLABORATED, TG_USER, TG_L2, TG_DEPRECATED, TG_REMOVED]
Countries: [CNT_EN]
Description: “Request-url factor. Value is the result of collaborative data filtering for the SamplePeriodDayFrc factor”
Authors: [“avatar”, “monnoroch”, “alsafr”]
Responsibles: [“avatar”, “monnoroch”]
}
Factor {
Index: 887
CppName: “FI_FAST_FILTER_MATRIX_NET”
Name: “FastFilterMatrixNet”
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: “SAAS-5758”
Authors: [“one million”]
Responsibles: [“one million”]
Description: “The MatrixNet value of the fast filtering model.”
}
Factor {
Index: 888
CppName: “FI_FAST_FILTER_POLYNOM”
Name: “FastFilterPolynom”
Tags: [TG_DOC, TG_DYNAMIC, TG_UNUSED, TG_TRANS]
Ticket: “SAAS-5758”
Authors: [“one million”]
Responsibles: [“one million”]
Description: “The Polynom value of the fast filtering ranking model.”
}
Factor {
Index: 889
CppName: “FI_QI_SP_AVG_TOTAL_FRC_REG”
Name: “QiSamplePeriodDayFrc”
Group: “QI”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_REGION, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_USER_EXT_DATA, TG_L2, TG_DEPRECATED]
Ticket: “FACTOR-442”
Description: “QI version of factor 879.”
Authors: “monnoroch”
Responsibles: [“monnoroch”, “tsimkha”]
}
Factor {
Index: 890
CppName: “FI_META_MATRIX_NET”
Name: “MetaMatrixNet”
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: “SAASSUP-3741”
Authors: [“one million”]
Responsibles: [“one million”]
Description: “Meta MatrixNet value.”
}
Factor {
Index: 891
CppName: “FI_META_POLYNOM”
Name: “MetaPolynom”
Tags: [TG_DOC, TG_DYNAMIC, TG_TRANS, TG_UNUSED]
Ticket: “SAASSUP-3741”
Authors: [“one million”]
Responsibles: [“one million”]
Description: “Meta Polynom value.”
}
Factor {
Index: 892
CppName: “FI_SHORT_VIDEO”
Name: “ShortVideo”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: “SEARCHPLAY-24”
Authors: [“bbetrozova”]
Responsibles: [“bbetrozova”, “alejes”]
Description: “A document is a short video (tiktok, reels, shorts).”
}
Factor {
Index: 893
CppName: “FI_TELEGRAM_CHANNEL_WEB”
Name: “TelegramChannelWebFormat”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: “SEARCHPLAY-49”
Authors: [“bbetrozova”]
Responsibles: [“bbetrozova”, “alejes”]
Description: “The document is a Telegram channel in web format.”
}
Factor {
Index: 894
CppName: “FI_TELEGRAM_POST”
Name: “TelegramPost”
Tags: [TG_DOC, TG_STATIC, TG_URL_TEXT, TG_BINARY, TG_OFTEN_ZERO, TG_L2, TG_UNUSED, TG_UNIMPLEMENTED]
Ticket: “SEARCHPLAY-49”
Authors: [“bbetrozova”]
Responsibles: [“bbetrozova”, “alejes”]
Description: “The document is a Telegram post.”
}
Factor {
Index: 895
CppName: “FI_CORRECTED_CTR_ANNOTATION_MATCH_PREDICTION”
Name: “CorrectedCtrAnnotationMatchPrediction”
Ticket: “FACTOR-468”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: “CorrectedCtrReg factor in annotation index, AnnotationMatchPrediction factor”
Authors: [“alsafr”, “smikler”]
Responsibles: “smikler”
}
Factor {
Index: 896
CppName: “FI_CORRECTED_CTR_QUERY_MATCH_PREDICTION”
Name: “CorrectedCtrQueryMatchPrediction”
Ticket: “FACTOR-468”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: “CorrectedCtrReg factor in annotation index, QueryMatchPrediction factor”
Authors: [“alsafr”, “smikler”]
Responsibles: “smikler”
}
Factor {
Index: 897
CppName: “FI_CORRECTED_CTR_VALUE_WCM_AVG”
Name: “CorrectedCtrValueWcmAvg”
Ticket: “FACTOR-468”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: “CorrectedCtrReg factor in annotation index, factor ValueWcmAvg”
Authors: [“alsafr”, “smikler”]
Responsibles: “smikler”
}
Factor {
Index: 898
CppName: “FI_CORRECTED_CTR_BM15_V4_K5”
Name: “CorrectedCtrBm15V4K5”
Ticket: “FACTOR-468”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: “CorrectedCtrReg factor in annotation index, factor Bm15V4K5”
Authors: [“alsafr”, “smikler”]
Responsibles: “smikler”
}
Factor {
Index: 899
CppName: “FI_IS_NOT_CGI”
Name: “IsNotCgi”
Ticket: “FACTOR-575”
Tags: [TG_STATIC, TG_URL_TEXT, TG_DOC, TG_L2, TG_NN_OVER_FEATURES_USE]
Description: “Factor reflecting whether the url contains the character ‘?’. It is equal to zero if the url has cgi-parameters (more precisely: if all duplicates have a ‘?’ symbol in their url).”
Authors: “ilnurkh”
Responsibles: “ilnurkh”
}
Factor {
Index: 900
CppName: “FI_ALICE_CLICK_DSSM”
Name: “AliceClickDssm”
Tags: [TG_DYNAMIC, TG_DOC, TG_USER, TG_USER_SEARCH, TG_URL_TEXT, TG_DOC_TEXT, TG_DOC_CONTENT, TG_NEURAL, TG_UNDOCUMENTED, TG_UNUSED, TG_ALICE_MUSIC, TG_RTMODELS_SERVICE, TG_ALLOW_USE_FOR_ALICE]
Description: “DSSM click prediction based on Alice-specific data”
Ticket: “SEARCHSPEC-132”
Authors: “an-to-nen-ko”
Responsibles: “an-to-nen-ko”
ImplementationTime: “2021-11-27”
}
Factor {
Index: 901
CppName: “FI_TEL_FULL_ATTRIBUTE_TEXT_BOCM15_K001”
Name: “TelFullAttributeTextBocm15K001”
Ticket: “SEARCHPLAY-70”
Description: “Factor over the tel_full telephone attributes from the original query. Document text. Bocm15 word-weight aggregation algorithm. Normalization coefficient 0.01.”
Tags: [TG_DOC, TG_DOC_TEXT, TG_TEXT_MACHINE, TG_UNDOCUMENTED, TG_DYNAMIC]
Authors: “ilnurkh”
Responsibles: “ilnurkh”
ImplementationTime: “2022-02-09”
}
Factor {
Index: 902
CppName: “FI_REMOVED_902”
Name: “Removed_902”
Tags: [TG_REMOVED]
}
Factor {
Index: 903
CppName: “FI_SAMPLE_PERIOD_DAY_FRC_QUERY_MATCH_PREDICTION”
Name: “SamplePeriodDayFrcQueryMatchPrediction”
Ticket: “FACTOR-605”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “SamplePeriodDayFrc factor in annotation index, QueryMatchPrediction factor”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 904
CppName: “FI_SAMPLE_PERIOD_DAY_FRC_ANNOTATION_MATCH_PREDICTION”
Name: “SamplePeriodDayFrcAnnotationMatchPrediction”
Ticket: “FACTOR-605”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/sampleperiod”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “SamplePeriodDayFrc factor in annotation index, AnnotationMatchPrediction factor”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 905
CppName: “FI_ONE_CLICK_QUERY_MATCH_PREDICTION”
Name: “OneClickQueryMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, QueryMatchPrediction factor”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 906
CppName: “FI_ONE_CLICK_ANNOTATION_MATCH_PREDICTION”
Name: “OneClickAnnotationMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, AnnotationMatchPrediction factor”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 907
CppName: “FI_ONE_CLICK_BM15_AK4”
Name: “OneClickBm15AK4”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, factor Bm15AK4”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 908
CppName: “FI_ONE_CLICK_BOCM_WEIGHTED_W1K3”
Name: “OneClickBocmWeightedW1K3”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, factor BocmWeightedW1K3”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 909
CppName: “FI_LONG_CLICK_QUERY_MATCH_PREDICTION”
Name: “LongClickQueryMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “LongClick factor in annotation index, QueryMatchPrediction factor”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 910
CppName: “FI_LONG_CLICK_ANNOTATION_MATCH_PREDICTION”
Name: “LongClickAnnotationMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “LongClick factor in annotation index, AnnotationMatchPrediction factor”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 911
CppName: “FI_LONG_CLICK_BM15_AK4”
Name: “LongClickBm15AK4”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “LongClick factor in annotation index, factor Bm15AK4”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 912
CppName: “FI_LONG_CLICK_BOCM_WEIGHTED_W1K3”
Name: “LongClickBocmWeightedW1K3”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “LongClick factor in annotation index, factor BocmWeightedW1K3”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 913
CppName: “FI_SPLIT_DWELL_TIME_QUERY_MATCH_PREDICTION”
Name: “SplitDwellTimeQueryMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “SplitDwellTime factor in annotation index, factor QueryMatchPrediction”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 914
CppName: “FI_SPLIT_DWELL_TIME_ANNOTATION_MATCH_PREDICTION”
Name: “SplitDwellTimeAnnotationMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “SplitDwellTime factor in annotation index, AnnotationMatchPrediction factor”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 915
CppName: “FI_BQPR_QUERY_MATCH_PREDICTION”
Name: “BQPRQueryMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “BQPR factor in annotation index, QueryMatchPrediction factor”
Authors: “smikler”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 916
CppName: “FI_BQPR_ANNOTATION_MATCH_PREDICTION”
Name: “BQPRAnnotationMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “BQPR factor in annotation index, AnnotationMatchPrediction factor”
Authors: “smikler”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 917
CppName: “FI_YABAR_VISITS_QUERY_MATCH_PREDICTION”
Name: “YabarVisitsQueryMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “YabarVisits factor in annotation index, factor QueryMatchPrediction”
Authors: [“akhropov”, “ilnurkh”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 918
CppName: “FI_YABAR_VISITS_ANNOTATION_MATCH_PREDICTION”
Name: “YabarVisitsAnnotationMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “YabarVisits factor in annotation index, factor AnnotationMatchPrediction”
Authors: [“akhropov”, “ilnurkh”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 919
CppName: “FI_YABAR_TIME_QUERY_MATCH_PREDICTION”
Name: “YabarTimeQueryMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “YabarTime factor in annotation index, QueryMatchPrediction factor”
Authors: [“akhropov”, “ilnurkh”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 920
CppName: “FI_YABAR_TIME_ANNOTATION_MATCH_PREDICTION”
Name: “YabarTimeAnnotationMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “YabarTime factor in annotation index, AnnotationMatchPrediction factor”
Authors: [“akhropov”, “ilnurkh”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 921
CppName: “FI_SIMPLE_CLICK_QUERY_MATCH_PREDICTION”
Name: “SimpleClickQueryMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “SimpleClick factor in annotation index, QueryMatchPrediction factor”
Authors: “monnoroch”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 922
CppName: “FI_SIMPLE_CLICK_ANNOTATION_MATCH_PREDICTION”
Name: “SimpleClickAnnotationMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “SimpleClick factor in annotation index, AnnotationMatchPrediction factor”
Authors: “monnoroch”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 923
CppName: “FI_LONG_CLICK_BOCM_PLAIN”
Name: “LongClickBocmPlain”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “LongClick factor in annotation index, BocmPlain factor”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 924
CppName: “FI_RANDOM_LOG_DBM35_XFACTOR_FULL_MATCH_PREDICTION”
Name: “RandomLogDBM35XfactorFullMatchPrediction”
Ticket: “FACTOR-579”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: “Result of collaborative filtering for factor FI_DBM35 from random log in annotation index, factor FullMatchPrediction”
Authors: [“avatar”, “alsafr”, “akhropov”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 925
CppName: “FI_RANDOM_LOG_DBM35_XFACTOR_ANNOTATION_MATCH_PREDICTION”
Name: “RandomLogDBM35XfactorAnnotationMatchPrediction”
Ticket: “FACTOR-579”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: “Result of collaborative filtering for factor FI_DBM35 from random log in annotation index, factor AnnotationMatchPrediction”
Authors: [“avatar”, “alsafr”, “akhropov”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 926
CppName: “FI_ONE_CLICK_SYNONYM_MATCH_PREDICTION”
Name: “OneClickSynonymMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, SynonymMatchPrediction factor”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 927
CppName: “FI_ONE_CLICK_FULL_MATCH_PREDICTION”
Name: “OneClickFullMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, FullMatchPrediction factor”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 928
CppName: “FI_ONE_CLICK_VALUE_WCM_AVG”
Name: “OneClickValueWcmAvg”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, factor ValueWcmAvg”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 929
CppName: “FI_ONE_CLICK_BOCM_WEIGHTED_MAX_K1”
Name: “OneClickBocmWeightedMaxK1”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, factor BocmWeightedMaxK1”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 930
CppName: “FI_ONE_CLICK_BM15_STRICT_K2”
Name: “OneClickBm15StrictK2”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, Bm15StrictK2 factor”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 931
CppName: “FI_ONE_CLICK_BM15_MAX_K3”
Name: “OneClickBm15MaxK3”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, Bm15MaxK3 factor”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 932
CppName: “FI_ONE_CLICK_BCLM_PLAIN_W1K3”
Name: “OneClickBclmPlainW1K3”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, BclmPlainW1K3 factor”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 933
CppName: “FI_ONE_CLICK_VALUE_WCM_MAX”
Name: “OneClickValueWcmMax”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, factor ValueWcmMax”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 934
CppName: “FI_ONE_CLICK_VALUE_WCM_PREDICTION”
Name: “OneClickValueWcmPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, factor ValueWcmPrediction”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 935
CppName: “FI_ONE_CLICK_BCLM_WEIGHTED_K3”
Name: “OneClickBclmWeightedK3”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “OneClick factor in annotation index, BclmWeightedK3 factor”
Authors: [“alsafr”, “pavelgur”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 936
CppName: “FI_BQPR_BOCM_WEIGHTED_W1_K3”
Name: “BQPRBocmWeightedW1K3”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “BQPR factor in annotation index, BocmWeightedW1K3 factor”
Authors: “smikler”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 937
CppName: “FI_BQPR_BM15_STRICT_K2”
Name: “BQPRBm15StrictK2”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_BROWSER, TG_USER_EXT_DATA, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “BQPR factor in annotation index, factor Bm15StrictK2”
Authors: “smikler”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 938
CppName: “FI_SPLIT_DWELL_BOCM_WEIGHTED_MAX_K1”
Name: “SplitDwellTimeBocmWeightedMaxK1”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “SplitDwellTime factor in annotation index, factor BocmWeightedMaxK1”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 939
CppName: “FI_SPLIT_DWELL_TIME_FULL_MATCH_PREDICTION”
Name: “SplitDwellTimeFullMatchPrediction”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “SplitDwellTime factor in annotation index, FullMatchPrediction factor”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 940
CppName: “FI_SPLIT_DWELL_TIME_VALUE_WCM_AVG”
Name: “SplitDwellTimeValueWcmAvg”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED]
Description: “SplitDwellTime factor in annotation index, factor ValueWcmAvg”
Authors: “pavelgur”
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 941
CppName: “FI_CORRECTED_CTR_BM15_STRICT_K2”
Name: “CorrectedCtrBm15StrictK2”
Ticket: “FACTOR-468”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_FILTER, TG_NN_OVER_FEATURES_USE, TG_USERFEAT, TG_USERFEAT_1832D, TG_USERFEAT_SEARCH_DWELL_TIME, TG_USERFEAT_USF, TG_FORMULA_2245_DEP_2, TG_DEPRECATED]
Description: “CorrectedCtrReg factor in annotation index, factor Bm15StrictK2”
Authors: [“alsafr”, “smikler”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 942
CppName: “FI_FRACTION_OF_QUERIES_WITH_GEO_PREDICTION”
Name: “FractionOfQueriesWithGeoPredicted”
DependsOn: [{Feature: [“FractionOfQueriesWithGeoPredicted”], Slice: “begemot_query_factors”}]
Ticket: “FACTOR-508”
Group: “Query”
Tags: [TG_QUERY_ONLY, TG_USER_SEARCH, TG_LOCALIZED_COUNTRY, TG_DYNAMIC, TG_L2, TG_DEPRECATED]
Countries: [CNT_ALL]
Description: “Predicted share of queries with geography, estimated from the bag of words built for the query”
Authors: [“yazevnul”]
Responsibles: [“yazevnul”, “esoloviev”]
}
Factor {
Index: 943
CppName: “FI_URL_IS_EXACT”
Name: “IsExactUrl”
DependsOn: [{Feature: [“IsExactUrl”], Slice: “begemot_query_factors”}]
Tags: [TG_BINARY, TG_DYNAMIC, TG_QUERY_ONLY, TG_OFTEN_ZERO, TG_L2, TG_DEPRECATED]
Description: “The query is a url, up to dots and spaces (the isurl wizard rule is used)”
Ticket: “FACTOR-682”
Authors: [“mbusel”, “smikler”]
Responsibles: “mbusel”
}
Factor {
Index: 944
CppName: “FI_RANDOM_LOG_DBM35_XFACTOR_VALUE_WCM_MAX”
Name: “RandomLogDBM35XfactorValueWcmMax”
Ticket: “FACTOR-579”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: “Result of collaborative filtering for factor FI_DBM35 from random log in annotation index, factor ValueWcmMax”
Authors: [“avatar”, “alsafr”, “akhropov”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 945
CppName: “FI_RANDOM_LOG_DBM35_XFACTOR_VALUE_WCM_AVG”
Name: “RandomLogDBM35XfactorValueWcmAvg”
Ticket: “FACTOR-579”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: “Result of collaborative filtering for factor FI_DBM35 from random log in annotation index, factor ValueWcmAvg”
Authors: [“avatar”, “alsafr”, “akhropov”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 946
CppName: “FI_RANDOM_LOG_DBM35_XFACTOR_BM15_STRICK_K2”
Name: “RandomLogDBM35XfactorBm15StrictK2”
Ticket: “FACTOR-579”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: “Result of collaborative filtering for factor FI_DBM35 from random log in annotation index, factor Bm15StrictK2”
Authors: [“avatar”, “alsafr”, “akhropov”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 947
CppName: “FI_RANDOM_LOG_DBM35_XFACTOR_BCLM_PLAIN_W1_k3”
Name: “RandomLogDBM35XfactorBclmPlainW1K3”
Ticket: “FACTOR-579”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: “Result of collaborative filtering for factor FI_DBM35 from random log in annotation index, factor BclmPlainW1K3”
Authors: [“avatar”, “alsafr”, “akhropov”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 948
CppName: “FI_RANDOM_LOG_DBM35_XFACTOR_BCLM_WEIGHTED_K3”
Name: “RandomLogDBM35XfactorBclmWeightedK3”
Ticket: “FACTOR-579”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_COLLABORATED, TG_REMOVED]
Countries: [CNT_TR]
Description: “Result of collaborative filtering for factor FI_DBM35 from random log in annotation index, factor BclmWeightedK3”
Authors: [“avatar”, “alsafr”, “akhropov”]
Responsibles: [“smikler”, “yustuken”, “diver”]
}
Factor {
Index: 949
CppName: “FI_RANDOM_LOG_DBM35_XFACTOR_BOCM_WEIGHTED_K3”
Name: “RandomLogDBM35XfactorBocmWeightedW1K3”
Ticket: “FACTOR-579”
Wiki: “https://wiki.yandex-team.ru/jandekspoisk/kachestvopoiska/factordev/web/factors/RandomLogDBM35”
Group: “Annotation”
Tags: [TG_DYNAMIC, TG_DOC, TG_LOCALIZED_COUNTRY, TG_USER, TG_USER_SEARCH, TG_USER_SEARCH_ONLY, TG_ANNOTATION_NOFILTER, TG_DEPRECATED, TG_C