From: Alexander Sadleir Date: Wed, 21 Mar 2012 03:18:54 +0000 Subject: Merge branch 'master' of ssh://apples.lambdacomplex.org/git/contractdashboard X-Git-Url: http://maxious.lambdacomplex.org/git/?p=contractdashboard.git&a=commitdiff&h=6e3b80c17d8ed9f0afe0db0403d9e82652250364 --- Merge branch 'master' of ssh://apples.lambdacomplex.org/git/contractdashboard --- --- a/admin/linkAmendments.php +++ b/admin/linkAmendments.php @@ -1,6 +1,9 @@ prepare($query); + $query->execute(); + $query = 'update contractnotice set "supplierABN" = null where "supplierABN" = \'0\''; $query = $conn->prepare($query); $query->execute(); $query = 'SELECT c."CNID",c."parentCN",p."childCN" FROM contractnotice as c LEFT OUTER JOIN contractnotice as p on c."parentCN" = p."CNID" --- /dev/null +++ b/admin/partialdata/scraper.txt @@ -1,1 +1,74 @@ += 1024 && $i < 4; $i++) $size /= 1024; + return round($size, 2).$units[$i]; +} +$days = 4; +if (isset($_REQUEST['days'])) $days = $_REQUEST['days']; +$startDate = strtotime("05-Jun-2008"); +if (isset($_REQUEST['startDate'])) $startDate = $_REQUEST['startDate']; + +function getFile($startDate, $days, $minVal, $maxVal) { +global $split; + $endDate = strtotime(date("Y-m-d", $startDate)." +".$days." days"); +$file = date("dMY",$startDate).'to'.date("dMY",$endDate).'val'.$minVal.'to'.$maxVal.'.xls'; +echo "Fetching $file ($days days) ($minVal < value < $maxVal )... "; +$url = "https://www.tenders.gov.au/?event=public.advancedsearch.CNSONRedirect&type=cnEvent&atmType=archived%2Cclosed%2Cpublished%2Cproposed&agencyUUID=&agencyStatus=-1&portfolioUUID=&keyword=&KeywordTypeSearch=AllWord&CNID=&dateType=Publish+Date&dateStart=".date("d-M-Y",$startDate)."&dateEnd=".date("d-M-Y",$endDate)."&supplierName=&supplierABN=&valueFrom=".$minVal."&valueTo=".$maxVal."&ATMID=&AgencyRefId=&consultancy=&download=Download+results"; +echo ""; +$current = file_get_contents($url); +if (strpos($current,"There are no results that match your selection.")> 0 ) { + echo "Empty file!
"; +} +if (strpos($current,"Your search returned more than 1000 results.") === false) { + file_put_contents($file, $current); + echo "$file saved
"; + echo format_bytes(filesize($file))."
"; + echo 'Load next '.($days).' days
'; + echo 'Load next '.($days*2).' days
'; + echo 'Load next '.($days).' days with split
'; + flush(); +if (!isset($_REQUEST['split']) && !$split) { +echo "Success so fetching next $days...
"; +getFile($endDate, $days, "" , ""); +} + return true; +} else { + echo "Too many records!
"; + echo 'Load '.($days/2).' days instead?
'; + echo 'Split instead?
'; + flush(); +if (!isset($_REQUEST['split']) && !$split) { +echo "Failure so splitting ...
"; + doSplit($startDate, $days); +} + return false; +} +} +function doSplit($startDate, $days) { +global $split; +$split = true; +set_time_limit(20); +getFile($startDate, $days, 0, 12000); +getFile($startDate, $days, 12000, 16000); + getFile($startDate, $days, 16000, 20000); + getFile($startDate, $days, 20000, 30000); + getFile($startDate, $days, 30000, 40000); +// getFile($startDate, $days, 40000, 80000); + getFile($startDate, $days, 40000, 60000); + getFile($startDate, $days, 60000, 80000); +// getFile($startDate, $days, 80000, 300000); + getFile($startDate, $days, 80000, 150000); + getFile($startDate, $days, 150000, 300000); + getFile($startDate, $days, 300000, 999999999); +} +if (isset($_REQUEST['split'])) { + doSplit($startDate, $days); +} else { + getFile($startDate, $days, "" , ""); +} +?> + --- a/displaySupplier.php +++ b/displaySupplier.php @@ -5,9 +5,9 @@ include_header("Supplier"); $supplierS = htmlentities(strip_tags($_REQUEST['supplier'])); - MethodCountGraph($supplierS); - CnCGraph($supplierS); - MethodValueGraph($supplierS); + // MethodCountGraph($supplierS); + // CnCGraph($supplierS); + // MethodValueGraph($supplierS); /* lobbyist ties links to ABR/ASIC/Google News/ASX/Court records @@ -27,12 +27,16 @@ echo $query; $query = $conn->prepare($query); -//$query->bindParam(":supplierName", $supplierName); + + if ($supplierParts[0] > 0) { $query->bindParam(":supplierABN", $supplierABN); + } else { + $query->bindParam(":supplierName", $supplierName); + } $query->execute(); databaseError($conn->errorInfo()); - echo ''; - echo ''; + // echo ''; + // echo ''; echo " --- a/lib/graphs.inc.php +++ b/lib/graphs.inc.php @@ -27,7 +27,11 @@ var d1 = []; var d2 = []; prepare($query); $query->execute(); $errors = $conn->errorInfo(); @@ -40,7 +44,9 @@ echo "d1.push([ " . intval($delta['cnid']) . ", " . intval($delta['count']) . "]); \n"; }; - $query = 'select cnid, count(*) from (select ("CNID" - MOD("CNID",100)) as cnid from contractnotice where "CNID" < 999999 and "parentCN" is not null) as a group by cnid order by cnid'; + $query = 'select cnid, count(*) from (select ("CNID"::integer - MOD("CNID"::integer,100)) as cnid + from contractnotice where "CNID" not like \'%-A%\' and "parentCN" is not null) + as a group by cnid order by cnid'; $query = $conn->prepare($query); $query->execute(); $errors = $conn->errorInfo(); @@ -71,7 +77,7 @@ points: { show: true } }, bars: { show: true } - }, + }] ]; var options = {