Parse.php 2.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899
  1. <?php
  2. namespace Spider\Lib;
  3. use Dever;
  4. class Parse
  5. {
  6. private $url = '';
  7. private $host = '';
  8. private $log;
  9. private $doc = array();
  10. private $data = array();
  11. public function __construct($url, $project, $rule, $col)
  12. {
  13. $doc = Doc::getInstance($url, $rule);
  14. $doc->log(new Log($project));
  15. $data = $doc->get();
  16. if ($data) {
  17. if (!is_array($data) && !is_object($data)) {
  18. $data = Dever::json_decode($data);
  19. }
  20. if ($data) {
  21. $domain = parse_url($url);
  22. $host = $domain['scheme'] . '://' . $domain['host'];
  23. foreach ($data as $k => $v) {
  24. if (!strstr($v, 'http')) {
  25. $v = $host . $v;
  26. }
  27. $this->data[$k] = $this->load($doc, $v, $col, $project);
  28. }
  29. }
  30. }
  31. $doc->saveLog();
  32. }
  33. public function get()
  34. {
  35. return $this->data;
  36. }
  37. private function load($doc, $data, $col, $project)
  38. {
  39. $result = $table = array();
  40. $data = $doc->init($data);
  41. foreach ($col as $v) {
  42. $callback = false;
  43. if (strpos($v['key'], '.') !== false) {
  44. $temp = explode('.', $v['key']);
  45. $v['key'] = $temp[1];
  46. $callback = $temp[0];
  47. }
  48. $value = $doc->rule($data, $col, $v);
  49. if ($value == 'error') {
  50. break;
  51. }
  52. if ($callback) {
  53. if (function_exists($callback)) {
  54. $value = $callback($value);
  55. } else {
  56. $value = Dever::{$callback}($value);
  57. }
  58. }
  59. $result[$v['key']] = $value;
  60. if (Dever::input('test') == 1) {
  61. $table[$v['name']] = $value;
  62. }
  63. }
  64. if (Dever::input('test') == 1) {
  65. $doc->outLog();
  66. print_r(Dever::table($table));die;
  67. }
  68. $this->update($result, $project);
  69. return $result;
  70. }
  71. private function update($data, $project)
  72. {
  73. $param['option_pid'] = $project;
  74. $param['option_value'] = json_encode($data, JSON_UNESCAPED_UNICODE);
  75. $info = Dever::db('spider/data')->one($param);
  76. if ($info) {
  77. $update = array();
  78. foreach ($param as $i => $j) {
  79. $i = str_replace('option_', 'set_', $i);
  80. $update[$i] = $j;
  81. }
  82. $id = $update['where_id'] = $info['id'];
  83. Dever::db('spider/data')->update($update);
  84. } else {
  85. $update = array();
  86. foreach ($param as $i => $j) {
  87. $i = str_replace('option_', 'add_', $i);
  88. $update[$i] = $j;
  89. }
  90. $id = Dever::db('spider/data')->insert($update);
  91. }
  92. }
  93. }