X-Git-Url: https://git.openstreetmap.org/nominatim.git/blobdiff_plain/f8bd4f5133903139c02b5423c93d7053215fea24..2051a84a09d4a370fa74db1ba8742e9095b842fc:/wikidata/pull_wikipedia_logs.php diff --git a/wikidata/pull_wikipedia_logs.php b/wikidata/pull_wikipedia_logs.php deleted file mode 100644 index 3e172069..00000000 --- a/wikidata/pull_wikipedia_logs.php +++ /dev/null @@ -1,79 +0,0 @@ - hour.txt'); - - $hPrevTotals = @fopen('totals.txt', 'r'); - $hDayTotals = @fopen('hour.txt', 'r'); - $hNewTotals = @fopen('newtotals.txt', 'w'); - - $sPrevKey = $sDayKey = true; - $sPrevLine = true; - $sDayLine = true; - - do { - if ($sPrevKey === $sDayKey) { - if ($sPrevLine !== true) fputs($hNewTotals, "$sPrevKey ".($iPrevValue+$iDayValue)."\n"); - $sPrevLine = true; - $sDayLine = true; - } elseif ($sDayKey !== false && ($sPrevKey > $sDayKey || $sPrevKey === false)) { - fputs($hNewTotals, "$sDayKey ".($iDayValue)."\n"); - $sDayLine = true; - } elseif ($sPrevKey !== false && ($sDayKey > $sPrevKey || $sDayKey === false)) { - fputs($hNewTotals, "$sPrevKey ".($iPrevValue)."\n"); - $sPrevLine = true; - } - - if ($sPrevLine === true) { - $sPrevLine = $hPrevTotals?fgets($hPrevTotals, 4096):false; - if ($sPrevLine !== false) { - $aPrevLine = explode(' ', $sPrevLine); - $sPrevKey = $aPrevLine[0].' '.$aPrevLine[1]; - $iPrevValue = (int)$aPrevLine[2]; - } else { - $sPrevKey = false; - $iPrevValue = 0; - } - } - - if ($sDayLine === true) { - $sDayLine = $hDayTotals?fgets($hDayTotals, 4096):false; - if ($sDayLine !== false) { - preg_match('#^([a-z]{2}) ([^ :]+) ([0-9]+) [0-9]+$#', $sDayLine, $aMatch); - $sDayKey = $aMatch[1].' '.$aMatch[2]; - $iDayValue = (int)$aMatch[3]; - } else { - $sDayKey = false; - $iDayValue = 0; - } - } - } while ($sPrevLine !== false || $sDayLine !== false); - - @fclose($hPrevTotals); - @fclose($hDayTotals); - @fclose($hNewTotals); - - @unlink('totals.txt'); - rename('newtotals.txt', 'totals.txt'); - } -} - -// Notes: -/* - gzip -dc $FILE.gz | grep -e "^en [^ :]\+ [0-9]\+" | - sed "s#\(^[a-z]\{2\}\) \([^ :]\+\) \([0-9]\+\) [0-9]\+#update wikipedia_article set hit_count = coalesce(hit_count,0) + \3 where language = '\1' - and title = catch_decode_url_part('\2');#g" | /opt/mapquest/stdbase-dev$ - cat totals.txt | sed "s#\(^[a-z]\{2\}\) \([^ ]\+\) \([0-9]\+\)\$#update entity_link set hits = s,0) + \3 where target = '\1wiki' and value = catch_decode_url_part('\2');#g" - cat totals.txt | sed "s#\(^[a-z]\{2\}\) \([^ ]\+\) \([0-9]\+\)\$#update entity_link set hits = coalesce(hits,0) + \3 where target = '\1wiki' and value = catch_decode_url_part('\2');#g" -*/