<?php | <?php |
include_once("../lib/common.inc.php"); | include_once("../lib/common.inc.php"); |
// Legacy rows use the string '0' to mean "no link"; turn that sentinel into
// NULL in both link columns before any renaming happens.
foreach (array('parentCN', 'childCN') as $linkColumn) {
    $clearSentinel = $conn->prepare(
        'update contractnotice set "' . $linkColumn . '" = null where "' . $linkColumn . '" = \'0\''
    );
    $clearSentinel->execute();
}

// Candidates for renaming: notices that have a parent and whose CNID ends in
// "00" followed by exactly one more character ('_' matches a single character).
$candidates = $conn->prepare(
    'select "CNID","parentCN" from contractnotice where "CNID" like \'%00_\' and "parentCN" is not null'
);
$candidates->execute();

// Prepared once and bound per row, so CNID values never become part of the SQL text.
$rename = $conn->prepare('UPDATE contractnotice SET "CNID" = :newCN where "CNID" = :oldCN');

foreach ($candidates->fetchAll() as $record) {
    $oldCN = $record['CNID'];
    // Dropping the three-character suffix should give back the parent's CNID.
    $parentCN = substr($oldCN, 0, -3);

    // Loose comparison kept deliberately: presumably the driver may return
    // "parentCN" as a number rather than a string -- TODO confirm column type.
    if ($parentCN != $record['parentCN']) {
        echo "parent CN unexpected - $oldCN doesn't look like child of {$record['parentCN']} <br>\n";
        continue;
    }

    // New id is "<parent>-A<last character of the old id>".
    $newCN = $parentCN . "-A" . substr($oldCN, -1);
    if ($rename->execute(array(':newCN' => $newCN, ':oldCN' => $oldCN))) {
        echo "$oldCN => $newCN (from parent CN $parentCN) <br>\n";
    } else {
        // Report the failure instead of claiming the rename happened.
        echo "rename of $oldCN failed <br>\n";
        print_r($rename->errorInfo());
    }
}
<?php | <?php |
include_once ("../lib/common.inc.php"); | include_once ("../lib/common.inc.php"); |
// Step 1: find notices that name a parent whose "childCN" back-link is still
// empty (the LEFT JOIN also returns rows whose parent is not in the table).
$orphans = $conn->prepare('SELECT c."CNID",c."parentCN",p."childCN" FROM contractnotice as c LEFT OUTER JOIN contractnotice as p on c."parentCN" = p."CNID"
WHERE
c."parentCN" > 0 AND p."childCN" IS NULL ');
$orphans->execute();
databaseError($conn->errorInfo());

// One prepared statement serves both steps; values are bound, never spliced into SQL.
$linkChild = $conn->prepare('UPDATE contractnotice SET "childCN" = :child where "CNID" = :cnid');

foreach ($orphans->fetchAll() as $row) {
    // Trace of the equivalent literal statement, kept so the page output stays the same.
    echo 'UPDATE contractnotice SET "childCN" = \'' .
        $row['CNID'] . '\' where "CNID" = \'' .
        $row['parentCN'] . '\';';
    // Success is decided by execute() itself. The pgsql driver reports status
    // code 7 for a fatal error, so that code must not be read as success.
    if ($linkChild->execute(array(':child' => $row['CNID'], ':cnid' => $row['parentCN']))) {
        echo $row['CNID'] . " linked to parent " . $row['parentCN'] . "<br>\n";
    } else {
        print_r($linkChild->errorInfo());
    }
}

// Step 2: several notices can share one parent while none of them has a child
// link yet (e.g. CN 100528/100529). Chain every such sibling to the latest
// sibling, which itself stays unlinked. "Unlinked" is accepted both as NULL
// (what step 1 tests for) and as the older 0 sentinel.
$siblings = $conn->prepare('SELECT "parentCN", array_agg("CNID"), count(*) from contractnotice WHERE "parentCN" IN
(
SELECT "parentCN"
FROM contractnotice
GROUP BY "parentCN"
HAVING COUNT(*) > 1
AND "parentCN" != 0
)
AND ("childCN" IS NULL OR "childCN" = 0)
GROUP BY "parentCN" having count(*) > 1');
$siblings->execute();
databaseError($conn->errorInfo());

foreach ($siblings->fetchAll() as $row) {
    // array_agg arrives as text such as "{100528,100529}"; strip the braces and split.
    $cnids = explode(",", str_replace(array("{", "}"), "", $row['array_agg']));
    // array_agg gives no ordering guarantee, so sort before picking the latest id.
    // Natural order assumes ids grow with time -- TODO confirm for suffixed ids.
    natsort($cnids);
    $last_cnid = array_pop($cnids);
    foreach ($cnids as $cnid) {
        if ($linkChild->execute(array(':child' => $last_cnid, ':cnid' => $cnid))) {
            echo $cnid . " linked to latest child " . $last_cnid . "<br>\n";
        } else {
            print_r($linkChild->errorInfo());
        }
    }
}
?> | ?> |
<?php | |
// date() and strtotime() calls in this script are evaluated in Melbourne time.
date_default_timezone_set('Australia/Melbourne');
// Flag read by getFile() and switched on by doSplit(): while true, getFile()
// neither advances to the next date window nor starts another split.
$split = false;
/**
 * Render a byte count as a short human-readable size such as "1.5 KB".
 *
 * The value is divided by 1024 until it drops below 1024 or the largest
 * unit (TB) is reached, then rounded.
 *
 * @param int|float|false $size      Number of bytes; false (as returned by a
 *                                   failed filesize()) is rendered as "0 B".
 * @param int             $precision Decimal places kept by round(); defaults to 2.
 * @return string Rounded value followed by a space and the unit.
 */
function format_bytes($size, $precision = 2) {
    $units = array(' B', ' KB', ' MB', ' GB', ' TB');
    $lastUnit = count($units) - 1;
    $size = (float) $size;
    $unit = 0;
    while ($size >= 1024 && $unit < $lastUnit) {
        $size /= 1024;
        $unit++;
    }
    return round($size, $precision) . $units[$unit];
}
// Window length in days. A request value is accepted only if it is a whole
// number of at least 1; anything else keeps the default, because the value is
// later used in date arithmetic and echoed into links.
$days = 4;
if (isset($_REQUEST['days'])) {
    $requestedDays = filter_var(
        $_REQUEST['days'],
        FILTER_VALIDATE_INT,
        array('options' => array('min_range' => 1))
    );
    if ($requestedDays !== false) {
        $days = $requestedDays;
    }
}

// Start of the first window as a Unix timestamp. The links printed by
// getFile() pass timestamps back in "startDate", so only non-negative
// integers are accepted.
$startDate = strtotime("05-Jun-2008");
if (isset($_REQUEST['startDate'])) {
    $requestedStart = filter_var(
        $_REQUEST['startDate'],
        FILTER_VALIDATE_INT,
        array('options' => array('min_range' => 0))
    );
    if ($requestedStart !== false) {
        $startDate = $requestedStart;
    }
}
/**
 * Download one contract-notice export from tenders.gov.au and save it as an
 * .xls file in the current directory.
 *
 * The export covers notices published between $startDate and
 * $startDate + $days, optionally restricted to a value band. Progress and
 * follow-up links are echoed as HTML.
 *
 * Unless a split was requested (via the request or the global $split flag):
 *  - after a saved download the function calls itself for the next window,
 *    stopping once that window would start in the future;
 *  - when the site reports more than 1000 results, it calls doSplit() for
 *    the same window.
 *
 * @param int        $startDate Unix timestamp of the first day of the window.
 * @param int        $days      Window length in days (values below 1 are treated as 1).
 * @param int|string $minVal    Lower contract value bound, or "" for none.
 * @param int|string $maxVal    Upper contract value bound, or "" for none.
 * @return bool true when a file was saved; false when the download failed or
 *              the result set was too large to export.
 */
function getFile($startDate, $days, $minVal, $maxVal) {
    global $split;

    // Both values end up in date arithmetic and in echoed links; force integers.
    $startDate = (int) $startDate;
    $days = max(1, (int) $days);

    $endDate = strtotime(date("Y-m-d", $startDate)." +".$days." days");
    $file = date("dMY",$startDate).'to'.date("dMY",$endDate).'val'.$minVal.'to'.$maxVal.'.xls';
    echo "Fetching $file ($days days) ($minVal < value < $maxVal )... ";
    $url = "https://www.tenders.gov.au/?event=public.advancedsearch.CNSONRedirect&type=cnEvent&atmType=archived%2Cclosed%2Cpublished%2Cproposed&agencyUUID=&agencyStatus=-1&portfolioUUID=&keyword=&KeywordTypeSearch=AllWord&CNID=&dateType=Publish+Date&dateStart=".date("d-M-Y",$startDate)."&dateEnd=".date("d-M-Y",$endDate)."&supplierName=&supplierABN=&valueFrom=".$minVal."&valueTo=".$maxVal."&ATMID=&AgencyRefId=&consultancy=&download=Download+results";
    echo "<!-- $url -->";

    $current = file_get_contents($url);
    if ($current === false) {
        // Nothing was received: do not write a file and do not advance.
        echo "<font color=red>Download failed!</font><br>";
        flush();
        return false;
    }

    // "!== false" so that a match at offset 0 is also recognised.
    if (strpos($current, "There are no results that match your selection.") !== false) {
        echo "<font color=red>Empty file!</font><br>";
    }

    $splitRequested = isset($_REQUEST['split']) || $split;

    if (strpos($current, "Your search returned more than 1000 results.") === false) {
        file_put_contents($file, $current);
        echo "$file saved<br>";
        echo format_bytes(filesize($file))."<br>";
        echo '<a href="?startDate='.$endDate.'&days='.$days.'">Load next '.($days).' days </a><br>';
        echo '<a href="?startDate='.$endDate.'&days='.($days*2).'">Load next '.($days*2).' days </a><br>';
        echo '<a href="?startDate='.$endDate.'&days='.$days.'&split=yes">Load next '.($days).' days with split</a><br>';
        flush();
        if (!$splitRequested) {
            if ($endDate >= time()) {
                // The next window would lie entirely in the future; without
                // this stop the function would keep calling itself forever.
                echo "Reached the present so stopping. <br>";
            } else {
                echo "Success so fetching next $days... <br>";
                getFile($endDate, $days, "" , "");
            }
        }
        return true;
    }

    // The site refuses to export more than 1000 rows: offer a shorter window
    // (never shorter than one day) or a split by value band.
    $halfDays = max(1, (int) floor($days / 2));
    echo "<font color=red>Too many records!</font><br>";
    echo '<a href="?startDate='.$startDate.'&days='.$halfDays.'">Load '.$halfDays.' days instead?</a><br>';
    echo '<a href="?startDate='.$startDate.'&days='.$days.'&split=yes">Split instead?</a><br>';
    flush();
    if (!$splitRequested) {
        echo "Failure so splitting ... <br>";
        doSplit($startDate, $days);
    }
    return false;
}
/**
 * Download one date window as a series of smaller exports, one per contract
 * value band, by calling getFile() once for each band.
 *
 * Sets the global $split flag first, so the getFile() calls made here neither
 * advance to the next window nor start another split.
 *
 * @param int $startDate Unix timestamp of the first day of the window.
 * @param int $days      Window length in days.
 * @return void
 */
function doSplit($startDate, $days) {
    global $split;
    $split = true;
    // Restart the execution timer with a 20 second limit before the batch of downloads.
    set_time_limit(20);

    // array(lower bound, upper bound) per band. 40000-80000 and 80000-300000
    // are each fetched as two narrower bands.
    $valueBands = array(
        array(0, 12000),
        array(12000, 16000),
        array(16000, 20000),
        array(20000, 30000),
        array(30000, 40000),
        array(40000, 60000),
        array(60000, 80000),
        array(80000, 150000),
        array(150000, 300000),
        array(300000, 999999999),
    );
    foreach ($valueBands as $band) {
        getFile($startDate, $days, $band[0], $band[1]);
    }
}
// Entry point: a "split" request parameter (any value) downloads the window
// band by band; otherwise the whole window is fetched with no value bounds.
if (isset($_REQUEST['split'])) {
    doSplit($startDate, $days);
} else {
    getFile($startDate, $days, "", "");
}
?> | |
<?php | <?php |
error_reporting(E_ALL); | error_reporting(E_ALL); |
include_once("../lib/common.inc.php"); | include_once("../lib/common.inc.php"); |
// Search/replace pairs applied to every official UNSPSC title. Each pair is
// applied on its own to the unmodified title, and the resulting text is
// registered as an additional lookup key for the same code.
$titleVariants = array(
    // some Australian spellings
    array("iz", "is"),
    array("fill", "fil"),
    array("efense", "efence"),
    array("rmored", "rmoured"),
    array("er", "re"),
    array("center", "centre"),
    array("accesor", "accessor"),
    array("lyz", "lys"),
    array("ire", "yre"),
    array("pe", "pae"),
    array("ane", "anae"),
    array("airplane", "aeroplane"),
    // some divergence from standard
    array("Information technology consultation services", "Forensic IT Services"),
    array("Power cable", "Power cable installation and supply"),
    array("Food Beverage and Tobacco Products", "Food and Beverage Products"),
    array("Building and Construction and Maintenance Services", "Architectural services"),
    // some just plain wrong
    array("Building and Construction and Maintenance Services", "Management and provision of all facilities engineering modification and maintenance services for a site or platform"),
);

// Build the title => UNSPSC code lookup. When two rows produce the same key,
// the row fetched later wins.
$unspsc = array();
$unspscresult = $conn->prepare('select * from "UNSPSCcategories";');
$unspscresult->execute();
foreach ($unspscresult->fetchAll() as $row) {
    $unspsc[$row['Title']] = $row['UNSPSC'];
    foreach ($titleVariants as $variant) {
        // A pair that does not occur in the title just re-registers the title itself.
        $unspsc[str_replace($variant[0], $variant[1], $row['Title'])] = $row['UNSPSC'];
    }
}

// Notices that still lack a category code.
$emptycatresult = $conn->prepare('SELECT "CNID","category","value"
FROM contractnotice
WHERE "categoryUNSPSC" IS NULL OR "categoryUNSPSC" = 0');
$emptycatresult->execute();

// Values are bound per row so category codes and CNIDs never become SQL text.
$setCategory = $conn->prepare('UPDATE contractnotice SET "categoryUNSPSC" = :code where "CNID" = :cnid');

// category text => summed contract value of the notices that could not be matched
$missing = array();
foreach ($emptycatresult->fetchAll() as $record) {
    $category = $record['category'];
    if (!isset($unspsc[$category]) || $unspsc[$category] == "") {
        $missing[$category] = (isset($missing[$category]) ? $missing[$category] : 0) + $record['value'];
        continue;
    }

    $updated = $setCategory->execute(array(':code' => $unspsc[$category], ':cnid' => $record['CNID']));
    // An update that touched no row counts as an error.
    if ($updated && $setCategory->rowCount() > 0) {
        echo $record['CNID'] . " set to " . ($unspsc[$category]) . " <br>\n";
    } else {
        echo "error<br>";
        print_r($setCategory->errorInfo());
    }
}

// Unmatched categories, sorted ascending by total value (largest totals printed last).
asort($missing, SORT_NUMERIC);
print_r($missing);
?> | ?> |
<?php | <?php |
include_once("./lib/common.inc.php"); | include_once("./lib/common.inc.php"); |
setlocale(LC_CTYPE, 'C'); | setlocale(LC_CTYPE, 'C'); |
// source: http://stackoverflow.com/questions/81934/easy-way-to-export-a-sql-table-without-access-to-the-server-or-phpmyadmin#81951 | // source: http://stackoverflow.com/questions/81934/easy-way-to-export-a-sql-table-without-access-to-the-server-or-phpmyadmin#81951 |
$unspsc = Array(); | |
$unspscresult = $conn->prepare('select * from "UNSPSCcategories" where "UNSPSC"::text like \'%00000\';'); | |
$unspscresult->execute(); | |
foreach ($unspscresult->fetchAll() as $row) { | |
$unspsc[$row['UNSPSC']] = $row['Title']; | |
} | |
$query = $conn->prepare(' | $query = $conn->prepare(' |
SELECT "CNID",contractnotice."agencyName",agency.abn as "agencyABN",EXTRACT(EPOCH FROM "publishDate") as "publishDate",EXTRACT(EPOCH FROM "contractStart") as "contractStart",EXTRACT(EPOCH FROM "contractEnd") as "contractEnd",value,description,"procurementMethod",category,"categoryUNSPSC", | SELECT "CNID",contractnotice."agencyName",agency.abn as "agencyABN", |
EXTRACT(EPOCH FROM "publishDate") as "publishDate", | |
EXTRACT(EPOCH FROM "contractStart") as "contractStart", | |
EXTRACT(EPOCH FROM "contractEnd") as "contractEnd", | |
value,description,"procurementMethod",category,"categoryUNSPSC", | |
(substr( "categoryUNSPSC"::text, 0, 2 ) || \'0000000\'::text) as "cat1", | |
(substr( "categoryUNSPSC"::text, 0, 3 ) || \'000000\'::text) as "cat2", | |
(substr( "categoryUNSPSC"::text, 0, 4 ) || \'00000\'::text) as "cat3", | |
"supplierABN","supplierName", | "supplierABN","supplierName", |
( | ( |
case when "supplierABN" != 0 THEN "supplierABN"::text ELSE "supplierName" END) as supplierID, | case when "supplierABN" != 0 THEN "supplierABN"::text ELSE "supplierName" END) as supplierID, |
(\'https://www.tenders.gov.au/?event=public.advancedsearch.keyword&keyword=CN\'::text || "CNID"::text) as sourceURL | (\'https://www.tenders.gov.au/?event=public.advancedsearch.keyword&keyword=CN\'::text || "CNID"::text) as sourceURL |
FROM contractnotice join agency on contractnotice."agencyName"=agency."agencyName" where "childCN" is null' | FROM contractnotice join agency on contractnotice."agencyName"=agency."agencyName" |
where "childCN" is null' | |
, array(PDO::ATTR_CURSOR => PDO::FETCH_ORI_NEXT)); | , array(PDO::ATTR_CURSOR => PDO::FETCH_ORI_NEXT)); |
// "supplierCity","supplierPostcode","supplierCountry","contactPostcode", | // "supplierCity","supplierPostcode","supplierCountry","contactPostcode", |
// (substr( "categoryUNSPSC"::text, 0, 2 ) || \'0000000\'::text) as "categoryUNSPSClv1", "categoryUNSPSC", (substr( "categoryUNSPSC"::text, 0, 3 ) || \'000000\'::text) as "categoryUNSPSClv2" "categoryUNSPSC", (substr( "categoryUNSPSC"::text, 0, 4 ) || \'00000\'::text as "categoryUNSPSClv3") | // |
$query->execute(); | $query->execute(); |
$errors = $conn->errorInfo(); | $errors = $conn->errorInfo(); |
if ($errors[2] != "") { | if ($errors[2] != "") { |
die("Export terminated, db error" . print_r($errors, true)); | die("Export terminated, db error" . print_r($errors, true)); |
} | } |
$num_fields = $query->columnCount(); | $num_fields = $query->columnCount(); |
$headers = array(); | $headers = Array(); |
for ($i = 0; $i < $num_fields; $i++) { | for ($i = 0; $i < $num_fields; $i++) { // for each column in query, make a CSV header |
$meta = $query->getColumnMeta($i); | $meta = $query->getColumnMeta($i); |
$headers[] = $meta['name']; | $headers[] = $meta['name']; |
} | } |
$fp = fopen('php://output', 'w'); | $fp = fopen('php://output', 'w'); |
if ($fp && $query) { | if ($fp && $query) { |
header('Content-Type: text/csv'); | header('Content-Type: text/csv'); |
header('Content-Disposition: attachment; filename="export.' . date("c") . '.csv"'); | header('Content-Disposition: attachment; filename="export.' . date("c") . '.csv"'); |
header('Pragma: no-cache'); | header('Pragma: no-cache'); |
header('Expires: 0'); | header('Expires: 0'); |
fputcsv($fp, $headers); | fputcsv($fp, $headers); |
while ($row = $query->fetch(PDO::FETCH_NUM, PDO::FETCH_ORI_NEXT)) { | while ($row = $query->fetch(PDO::FETCH_NUM, PDO::FETCH_ORI_NEXT)) { |
foreach ($row as $key => &$colvalue) { | foreach ($row as $key => &$colvalue) { |
$colvalue = preg_replace('/[^[:print:]]/', '', utf8_encode($colvalue)); | $colvalue = preg_replace('/[^[:print:]]/', '', utf8_encode($colvalue)); |
if ($headers[$key] == "publishDate" || $headers[$key] == "contractStart" | if ($headers[$key] == "publishDate" || $headers[$key] == "contractStart" |
|| $headers[$key] == "contractEnd") { | || $headers[$key] == "contractEnd") { |
$colvalue = date("Y-m-d", $colvalue); | $colvalue = date("Y-m-d", $colvalue); |
} | } |