Ejemplo n.º 1
0
<?php

// Load the AWS SDK for PHP. The path used here expects the SDK under a
// vendor/ directory located next to this script; adjust it if yours differs.
require_once dirname(__FILE__) . '/vendor/amazonwebservices/aws-sdk-for-php/sdk.class.php';

// Create the DynamoDB client with credentials read from the environment.
$credentials = array(
    'key' => getenv('AWS_ACCESS_KEY'),
    'secret' => getenv('AWS_SECRET_KEY'),
);
$dynamodb = new AmazonDynamoDB($credentials);

// The endpoint host name is assembled from the AWS_REGION environment variable.
$endpoint = 'dynamodb.' . getenv('AWS_REGION') . '.amazonaws.com';
$dynamodb->set_region($endpoint);

// Lower bound for the range key: the timestamp 14 days before now.
$fourteen_days_ago = date('Y-m-d H:i:s', strtotime("-14 days"));

// Items under one hash key whose range key is greater than or equal to that timestamp.
$range_condition = array(
    'ComparisonOperator' => AmazonDynamoDB::CONDITION_GREATER_THAN_OR_EQUAL,
    'AttributeValueList' => array(
        array(AmazonDynamoDB::TYPE_STRING => $fourteen_days_ago),
    ),
);
$query = array(
    'TableName' => 'Reply',
    'HashKeyValue' => array(AmazonDynamoDB::TYPE_STRING => 'Amazon DynamoDB#DynamoDB Thread 2'),
    'RangeKeyCondition' => $range_condition,
);
$response = $dynamodb->query($query);

// Dump the raw response as plain text; a response code of 200 indicates success.
header('content-type: text/plain');
print_r($response);
?>

Ejemplo n.º 2
0
 /**
  * Deprecated retailer lookup: searches one UPC at a retailer, stores every
  * offer that has a price in the product-trends table, and records a violation
  * (with a screenshot reference) for offers that get_products_by_floor() reports.
  *
  * Only the LAST entry of $upcs is processed; the original code notes
  * "only one index", so callers presumably pass a single UPC (confirm).
  *
  * @param mixed $api         Retailer/API identifier; used as the stats key, stored as
  *                           the 'ar' attribute and passed to the helper methods.
  * @param mixed $search_url  Passed to _spider_search() and getMerchantNameForKey().
  * @param array $upcs        UPCs to look up; only the last element is used.
  * @param array $floor_price Indexed by the same keys as $upcs; each entry carries 'floor_price'.
  * @param mixed $cron_log_id Id of the cron_log row whose counters are updated.
  * @param mixed $store_id    Passed to Products->get_products_by_floor().
  *
  * @return void
  */
 private function _retailer_lookup_deprecated($api, $search_url, $upcs, $floor_price, $cron_log_id, $store_id)
 {
     // Without any UPC there is nothing to look up. Previously this fell through
     // with $key/$upc undefined and ran the search and flag update for a null UPC.
     if (empty($upcs)) {
         return;
     }
     // Walk to the last element: only that UPC (and its floor price) is processed.
     $key = null;
     $upc = null;
     foreach ($upcs as $key => $upc) {
         // intentionally empty
     }
     $price_floor = $floor_price[$key]['floor_price'];
     $retailer_data = $this->_spider_search($upc, $api, $search_url);
     if (!isset($retailer_data[0])) {
         // No search results: flag the UPC with '0' and stop.
         $this->updateUPCFlag($upc, $api, '0');
         return;
     }
     $this->myDB = new mydb();
     $avg_price = 0;
     // Maps a product URL to the screenshot path already requested for it during this call.
     $uniquArr = array();
     // Created lazily and shared by every DynamoDB query issued during this call.
     $dynamo = null;
     foreach ($retailer_data as $item) {
         $this->stats[$api]['data_found']++;
         $crawled_product = array();
         $violation = array();
         $author = $this->getMerchantNameForKey($api, $upc, $api, $api, $api, $search_url);
         if (empty($author)) {
             // assert dummy value
             $author = "No name found.";
         }
         // NOTE(review): this statement is built by string interpolation. If $upc or
         // $cron_log_id can carry untrusted input it must be escaped/parameterised
         // through whatever API mydb offers (not visible from here).
         $stQuery = "UPDATE cron_log set google_count=(google_count+1), last_UPC='{$upc}' WHERE id= '{$cron_log_id}' ";
         $this->myDB->simpleQuery($stQuery);
         $hashKey = $author . '#' . $upc;
         $crawled_product['um'] = $hashKey;
         $crawled_product['dt'] = time();
         $crawled_product['ap'] = $price_floor;
         $crawled_product['t'] = isset($item['product.name']) ? $item['product.name'] : '';
         $crawled_product['mu'] = isset($item['seller.aboutus']) ? $item['seller.aboutus'] : '';
         $crawled_product['l'] = isset($item['product.url']) ? $item['product.url'] : '';
         $crawled_product['ar'] = $api;
         $crawled_product['mil'] = isset($item['seller.logo']) ? $item['seller.logo'] : '';
         $crawled_product['il'] = isset($item['product.image_url']) ? $item['product.image_url'] : '';
         $crawled_product['mpo'] = isset($item['product.price_listed']) ? $this->parseDollarAmount($item['product.price_listed']) : 0;
         $crawled_product['msp'] = isset($item['product.shipping']) ? $item['product.shipping'] : 0;
         if (!$crawled_product['mpo']) {
             email_alertToTeam($api . '_lookup', 'Product data found, but price not found for UPC ' . $upc);
             continue;
         }
         $this->stats[$api]['price_found']++;
         $avg_price = $this->_new_avg($avg_price, $crawled_product['mpo']);
         if ($dynamo === null) {
             $dynamo = new AmazonDynamoDB();
         }
         // Fetch the most recent stored record for this key BEFORE inserting the new
         // one, so it reflects the previous crawl.
         $lastRecordResponse = $dynamo->query(array('TableName' => $this->_dynamo_products_trends, 'HashKeyValue' => array(AmazonDynamoDB::TYPE_STRING => $crawled_product['um']), 'ConsistentRead' => true, 'Limit' => 1, 'ScanIndexForward' => false));
         $insert_response = $this->amzdb->insertData($this->_dynamo_products_trends, $crawled_product, $api);
         if (isset($insert_response->status) && $insert_response->status == 200) {
             $this->insertUPCMerchant($author, $upc, $api, $crawled_product['mpo'], $api, $api);
         }
         // get the corresponding crowlMerchantName row
         $crowlMerchantName = $this->Crawl_data->crowlMerchantBySellerID($api);
         if (empty($crowlMerchantName)) {
             log_message('error', __FILE__ . ' Crowl_m::' . $api . '_lookup() Line ' . __LINE__ . ': crowl_merchant_name record not found for seller ID ' . $api);
         }
         $crowlMerchantNameID = isset($crowlMerchantName->id) ? $crowlMerchantName->id : 0;
         $violatedPrice = (double) $crawled_product['mpo'];
         $dataVio = $this->Products->get_products_by_floor($upc, $violatedPrice, $store_id);
         if (!$dataVio) {
             // update price violators for products not in violation
             $this->Violator->updatePriceViolator($crowlMerchantNameID, $upc, 0, $crawled_product['dt']);
             continue;
         }
         $violation['um'] = $hashKey;
         $violation['dt'] = $crawled_product['dt'];
         $violation['ss'] = date('Ymd', $violation['dt']) . '/' . md5($hashKey . $violation['dt']) . '.png';
         $this->updateViolationSummary($dataVio);
         $this->Violator->updatePriceViolator($crowlMerchantNameID, $upc, 1, $crawled_product['dt']);
         // Price and keys of the previous crawl record, when one could be read.
         $lastCrawlPrice = (double) 0;
         $lastHashKey = null;
         $lastRangeKey = null;
         if ($lastRecordResponse->isOK()) {
             // mpo = Merchant Price Offered
             $lastCrawlPrice = isset($lastRecordResponse->body->Items->mpo->N) ? (double) $lastRecordResponse->body->Items->mpo->N : (double) 0;
             $lastHashKey = isset($lastRecordResponse->body->Items->um->S) ? $lastRecordResponse->body->Items->um->S : null;
             $lastRangeKey = isset($lastRecordResponse->body->Items->dt->N) ? $lastRecordResponse->body->Items->dt->N : null;
         }
         // Check if the price has changed
         if ((double) $lastCrawlPrice != (double) $violatedPrice) {
             // Price changed: request one screenshot per product URL and reuse it
             // for further offers that point at the same URL.
             if (!isset($uniquArr[$crawled_product['l']])) {
                 $uniquArr[$crawled_product['l']] = $violation['ss'];
                 $this->addScreenShot($crawled_product['l'], $violation['ss'], false, $violatedPrice);
             } else {
                 $violation['ss'] = $uniquArr[$crawled_product['l']];
             }
         } else {
             // Price unchanged: reuse the previous violation's screenshot if it can
             // still be opened, otherwise request a new one.
             $takeNewScreenShot = true;
             if (!empty($lastHashKey) and !empty($lastRangeKey)) {
                 // ConsistentRead is passed as a boolean here, matching the trends query above.
                 $lastViolationResponse = $dynamo->query(array('TableName' => $this->_dynamo_violations, 'HashKeyValue' => array(AmazonDynamoDB::TYPE_STRING => (string) $lastHashKey), 'RangeKeyCondition' => array('ComparisonOperator' => AmazonDynamoDB::CONDITION_EQUAL, 'AttributeValueList' => array(array(AmazonDynamoDB::TYPE_NUMBER => (string) $lastRangeKey))), 'ConsistentRead' => true));
                 if ($lastViolationResponse->isOK() and $lastViolationResponse->body->Count == 1) {
                     if (isset($lastViolationResponse->body->Items->ss->S)) {
                         // fopen() serves only as an existence probe; errors are
                         // suppressed and the handle is closed right away so it does not leak.
                         $probe = @fopen(get_instance()->config->item('s3_cname') . 'stickyvision/violations/' . $lastViolationResponse->body->Items->ss->S, 'r');
                         if ($probe) {
                             fclose($probe);
                             $violation['ss'] = $lastViolationResponse->body->Items->ss->S;
                             $takeNewScreenShot = false;
                         }
                     }
                 }
             }
             if ($takeNewScreenShot === true) {
                 $this->addScreenShot($crawled_product['l'], $violation['ss'], false, $violatedPrice);
             }
         }
         $this->amzdb->insertData($this->_dynamo_violations, $violation, $api);
     }
     $this->myDB->close();
     $this->updateUPCFlag($upc, $api, '1');
 }
Ejemplo n.º 3
0
 /**
  * Cron entry point: runs every configured crawler against every tracked
  * product, stores each offer in the product-trends table, records price
  * violations (with a screenshot reference), writes the log rows and then
  * terminates the script with exit.
  *
  * Errors raised while processing a single product are caught, logged through
  * CrawlerErrorLog and e-mailed to the team; processing continues with the next
  * product.
  *
  * @return void This method does not return; it ends with exit.
  *
  * @throws Exception When a crawler's file or class cannot be found (raised
  *                   outside the per-product try/catch).
  */
 public function run()
 {
     $this->_start_time = date('Y-m-d H:i:s');
     $this->_cron_log_id = $this->Log->create_log($this->_start_time);
     //need to get all products
     $productCount = $this->Products->get_all_tracked_products_count();
     $offset = 0;
     //queue up products -- so we don't crash the machine with a lot of products
     // NOTE(review): $offset is advanced but never handed to get_all_tracked_products(),
     // so every pass appears to request the same result set and merge it again.
     // Confirm against the model before relying on this batching.
     do {
         $products = $this->Products->get_all_tracked_products();
         $this->_products = array_merge($products, $this->_products);
         $this->_numproducts += count($products);
         $offset += 500;
     } while ($offset < $productCount);
     // Maps a product URL to the screenshot path already requested for it; shared
     // across all products and crawlers of this run.
     $uniquArr = array();
     if (count($this->_crawlers) > 0) {
         foreach ($this->_crawlers as $crawler) {
             $crawlerName = strtolower(trim($crawler['name']));
             $filePath = FCPATH . 'system/application/crawlers/' . $crawlerName . '.php';
             //check to see if crawler exists
             if (@file_exists($filePath) === false) {
                 throw new Exception('The crawler ' . $crawlerName . ' file does not exist. Please add it.');
             }
             require_once $filePath;
             if (class_exists($crawlerName) === false) {
                 throw new Exception('The crawler ' . $crawlerName . ' crawler class is not available. Please check that its defined within the file');
             }
             $this->_currentCrawler = $crawlerName;
             $this->_crawlerClass = new $crawlerName($crawler);
             // Resolve the last product once, outside the loop, so the array's internal
             // pointer is not moved while the same array is being iterated.
             $lastProduct = end($this->_products);
             foreach ($this->_products as $product) {
                 if ($product === $lastProduct) {
                     $this->_last_upc = $product->upc_code;
                 }
                 try {
                     $this->_current_product_id = $product->id;
                     $this->_crawlerClass->setIdentifier($product->upc_code);
                     $productData = $this->_crawlerClass->getProduct();
                     $offers = $this->_crawlerClass->getAllOffers();
                     $this->_numfoundproducts++;
                     foreach ($offers as $offer) {
                         $this->_numofferings++;
                         $crawled_products = array();
                         if (empty($offer['merchant'])) {
                             throw new Exception('Merchant not defined.');
                         }
                         // Read defensively so a missing key reaches the exception below
                         // instead of raising an undefined-index notice first.
                         $marketplace = isset($offer['marketplace']) ? $offer['marketplace'] : null;
                         if (empty($marketplace)) {
                             throw new Exception('Marketplace not defined');
                         }
                         // Keep everything before the last dot-separated segment, lower-cased.
                         $r = preg_split('/(?=\\.[^.]+$)/', $marketplace);
                         $marketplace = strtolower($r[0]);
                         $merchant = $this->Crowl->getMerchantNameForKey($offer['merchant'], $product->upc_code, $marketplace, $offer['merchant'], $offer['merchant'], extractDomainByURL($offer['url']));
                         $this->_marketplaces[] = $offer['marketplace'];
                         if (empty($offer['price_floor']) || !is_numeric($offer['price_floor'])) {
                             throw new Exception('Price floor is undefined');
                         }
                         $crawled_products['ap'] = $offer['price_floor'];
                         $title = $productData->get("title");
                         if (empty($title)) {
                             throw new Exception('Title is undefined');
                         }
                         $crawled_products['t'] = $title;
                         $crawled_products['ar'] = $marketplace;
                         $crawled_products['il'] = null;
                         if (empty($offer['url'])) {
                             throw new Exception('Url is undefined');
                         }
                         $crawled_products['l'] = $offer['url'];
                         $crawled_products['mu'] = isset($offer['merchant_url']) ? $offer['merchant_url'] : null;
                         if (empty($offer['price']) || !is_numeric($offer['price'])) {
                             throw new Exception('Price is undefined');
                         }
                         $crawled_products['mpo'] = $offer['price'];
                         $hashKey = $marketplace . '#' . $product->upc_code;
                         $crawled_products['um'] = $hashKey;
                         $crawled_products['dt'] = time();
                         // Fetch the most recent stored record for this key BEFORE inserting
                         // the new one, so it reflects the previous crawl.
                         $dynamo = new AmazonDynamoDB();
                         $lastRecordResponse = $dynamo->query(array('TableName' => $this->_dynamo_products_trends, 'HashKeyValue' => array(AmazonDynamoDB::TYPE_STRING => $crawled_products['um']), 'ConsistentRead' => true, 'Limit' => 1, 'ScanIndexForward' => false));
                         var_dump($crawled_products);
                         $insert_response = $this->amzdb->insertData($this->_dynamo_products_trends, $crawled_products, $marketplace);
                         if (isset($insert_response->status) && $insert_response->status == 200) {
                             $this->Crowl->insertUPCMerchant($merchant, $product->upc_code, $marketplace, $crawled_products['mpo']);
                         }
                         $crowlMerchantName = $this->Crawl_data->crowlMerchantByMerchantName($merchant);
                         if (empty($crowlMerchantName)) {
                             log_message('error', __FILE__ . ' Crowl_m::amazon_lookup() Line ' . __LINE__ . ': crowl_merchant_name record not found for merchant ' . $offer['merchant']);
                         }
                         $crowlMerchantNameID = isset($crowlMerchantName->id) ? $crowlMerchantName->id : 0;
                         $violatedPrice = (double) $crawled_products['mpo'];
                         $dataVio = $this->Products->get_products_by_floor($product->upc_code, $violatedPrice, $product->store_id);
                         if ($dataVio) {
                             $violation = array();
                             $violation['um'] = $hashKey;
                             $violation['dt'] = $crawled_products['dt'];
                             $violation['ss'] = date('Ymd', $violation['dt']) . '/' . md5($hashKey . $violation['dt']) . '.png';
                             $this->Crowl->updateViolationSummary($dataVio);
                             $this->Violator->updatePriceViolator($crowlMerchantNameID, $product->upc_code, 1, $crawled_products['dt']);
                             // Price and keys of the previous crawl record, when one could be read.
                             $lastCrawlPrice = (double) 0;
                             $lastHashKey = null;
                             $lastRangeKey = null;
                             if ($lastRecordResponse->isOK()) {
                                 // mpo = Merchant Price Offered
                                 $lastCrawlPrice = isset($lastRecordResponse->body->Items->mpo->N) ? (double) $lastRecordResponse->body->Items->mpo->N : (double) 0;
                                 $lastHashKey = isset($lastRecordResponse->body->Items->um->S) ? $lastRecordResponse->body->Items->um->S : null;
                                 $lastRangeKey = isset($lastRecordResponse->body->Items->dt->N) ? $lastRecordResponse->body->Items->dt->N : null;
                             }
                             // Check if the price has changed
                             if ($lastCrawlPrice != $violatedPrice) {
                                 // Price changed: request one screenshot per product URL and
                                 // reuse it for further offers pointing at the same URL.
                                 if (!isset($uniquArr[$crawled_products['l']])) {
                                     $uniquArr[$crawled_products['l']] = $violation['ss'];
                                     $this->Crowl->addScreenShot($crawled_products['l'], $violation['ss'], false, $violatedPrice);
                                 } else {
                                     $violation['ss'] = $uniquArr[$crawled_products['l']];
                                 }
                             } else {
                                 // Price unchanged: a new screenshot is requested only when the
                                 // previous violation names one that can no longer be opened.
                                 $takeNewScreenShot = false;
                                 if (!is_null($lastHashKey) and !is_null($lastRangeKey)) {
                                     $lastViolationResponse = $dynamo->query(array('TableName' => $this->_dynamo_violations, 'HashKeyValue' => array(AmazonDynamoDB::TYPE_STRING => (string) $lastHashKey), 'RangeKeyCondition' => array('ComparisonOperator' => AmazonDynamoDB::CONDITION_EQUAL, 'AttributeValueList' => array(array(AmazonDynamoDB::TYPE_NUMBER => (string) $lastRangeKey)))));
                                     if ($lastViolationResponse->isOK() and $lastViolationResponse->body->Count == 1) {
                                         if (isset($lastViolationResponse->body->Items->ss->S)) {
                                             // fopen() serves only as an existence probe; errors are
                                             // suppressed and the handle is closed right away so it
                                             // does not leak across the run.
                                             $probe = @fopen(get_instance()->config->item('s3_cname') . 'stickyvision/violations/' . $lastViolationResponse->body->Items->ss->S, 'r');
                                             if ($probe) {
                                                 fclose($probe);
                                                 $violation['ss'] = $lastViolationResponse->body->Items->ss->S;
                                                 $takeNewScreenShot = false;
                                             } else {
                                                 $takeNewScreenShot = true;
                                             }
                                         }
                                     }
                                 }
                                 if ($takeNewScreenShot === true) {
                                     $this->Crowl->addScreenShot($crawled_products['l'], $violation['ss'], false, $violatedPrice);
                                 }
                             }
                             $this->amzdb->insertData($this->_dynamo_violations, $violation, $marketplace);
                         } else {
                             // update price violators for products not in violation
                             $this->Violator->updatePriceViolator($crowlMerchantNameID, $product->upc_code, 0, $crawled_products['dt']);
                         }
                         $this->Crowl->updateUPCFlag($product->upc_code, $marketplace, '1');
                     }
                     //end offers iteration
                     $this->_crawlerClass->reset();
                 } catch (Exception $e) {
                     // One failing product must not stop the run: record it, alert, move on.
                     $exceptionDetail = array('crawler_log_id' => $this->_cron_log_id, 'crawler_name' => $this->_currentCrawler, 'message' => $e->getMessage(), 'created_at' => date('Y-m-d H:i:s'), 'product_id' => $this->_current_product_id);
                     echo 'exception detected..';
                     var_dump($exceptionDetail);
                     $this->CrawlerErrorLog->create_log($exceptionDetail);
                     //send an alert to the team
                     email_alertToTeam('Run Cron Job - Error Cron Log ID ' . $this->_cron_log_id . ' : ' . $e->getMessage());
                 }
             }
         }
     }
     $this->_end_time = date('Y-m-d H:i:s');
     $this->Log->update_log($this->_cron_log_id, array('end_datetime' => $this->_end_time, 'products_count' => $this->_numfoundproducts, 'offerings_count' => $this->_numofferings));
     //create cron_log -- this is needed to handle code that still thinks we need to use old crawler
     $this->_marketplaces = array_unique($this->_marketplaces);
     foreach ($this->_marketplaces as $marketplace) {
         $domain = trim($marketplace);
         $r = preg_split('/(?=\\.[^.]+$)/', $domain);
         $marketplace = strtolower($r[0]);
         // One legacy cron_log row per marketplace seen in this run.
         $this->CronLog->create_log(array('datetime' => date('Y-m-d H:i:s'), 'key' => generate_rand(32), 'api_type' => $marketplace, 'start_datetime' => $this->_start_time, 'end_datetime' => $this->_end_time, 'google_count' => 0, 'last_UPC' => $this->_last_upc, 'run_from' => 'cronTab1'));
         $this->Marketplace->add_retailer(strtolower($marketplace), strtolower($domain));
     }
     exit;
 }