-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathcreateRankLib.php
34 lines (28 loc) · 1.12 KB
/
createRankLib.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
<?php
/**
* A convenience script to create a ranklib file from all labeled data using defaults
*
* Defaults:
* - expects instance of elasticsearch at `https://127.0.0.1:9243/` with index commonswiki_file
* - uses the elasticsearch featureset labeled $featureSetName
* - the ranklib file will be output to out/$featureSetName.tsv
*/
$featureSetName = 'MediaSearch_20211206';
$searchTermsWithEntitiesFile = "out/searchTermsWithEntitiesAndTitleMatch.csv";
shell_exec(
'php jobs/GenerateSearchTermsWithEntitiesFile.php ' .
' --outputFile="' . $searchTermsWithEntitiesFile . '"'
);
shell_exec(
'php jobs/GenerateFeatureQueries.php ' .
' --searchTermsWithEntitiesFile="' . $searchTermsWithEntitiesFile . '"' .
' --queryJsonGenerator="MediaSearchSignalTest\Jobs\\' . $featureSetName . '"'
);
shell_exec(
'php jobs/GenerateRanklibFile.php ' .
' --queryDir="out/ltr/" '.
' --featuresetName=' . $featureSetName . '_plain' .
' --stemmedFeaturesetName=' . $featureSetName . '_stemmed' .
' --searchIndex=commonswiki_file' .
' --searchTermsWithEntitiesFile="' . $searchTermsWithEntitiesFile . '"'
);