Exemple #1
0
 def schedule(self,
              project_name,
              spider_name,
              priority=0,
              setting=None,
              job_id=None,
              version=None,
              args={}):
     """
     Schedule a spider run , return job id
     """
     url, method = self.command_set["schedule"]
     data = {}
     data["project"] = project_name
     data["priority"] = priority
     data["spider"] = spider_name
     if setting is not None:
         data["setting"] = setting
     if job_id is not None:
         data["jobid"] = job_id
     if version is not None:
         data["_version"] = version
     for k, v in args.items():
         data[k] = v
     response = http_utils.request(url,
                                   method_type=method,
                                   data=data,
                                   return_type=http_utils.RETURN_JSON)
     return response
Exemple #2
0
 def get_project_list(self):
     """
     Get the list of projects uploaded to this scrapy server
     """
     url, method = self.command_set["listprojects"]
     response = http_utils.request(url,
                                   method_type=method,
                                   return_type=http_utils.RETURN_JSON)
     return response
Exemple #3
0
 def get_logs(self, project_name, spider_name):
     """
     Get urls that scrapd logs file by project name and spider name
     """
     url, method = self.command_set["logs"]
     url = url + "/" + spider.name + "/"
     response = http_utils.request(url, method_type=method)
     html_parser = ScrapyLogsPageHTMLParser()
     html_parser.feed(response)
     html_parser.clean_enter_sign()
     return html_parser.result, [url + x for x in html_parser.result]
Exemple #4
0
 def delete_project(self, project_name):
     """
     Delete a project and all its uploaded versions
     """
     url, method = self.command_set["delproject"]
     data = {"project": project_name}
     response = http_utils.request(url,
                                   method_type=method,
                                   data=data,
                                   return_type=http_utils.RETURN_JSON)
     return response
Exemple #5
0
 def get_job_list(self, project_name):
     """
     Get the list of pending, running and finished jobs of some project.
     """
     url, method = self.command_set["listjobs"]
     data = {"project": project_name}
     response = http_utils.request(url,
                                   method_type=method,
                                   data=data,
                                   return_type=http_utils.RETURN_JSON)
     return response
Exemple #6
0
 def get_version_list(self, project_name):
     """
     Get the list of versions avaliabel for some project
     """
     url, method = self.command_set["listversions"]
     data = {"project": project_name}
     response = http_utils.request(url,
                                   method_type=method,
                                   data=data,
                                   return_type=http_utils.RETURN_JSON)
     return response
Exemple #7
0
    def get_load_status(self):
        """
        To check the load status of a service
        return : a dictionary that include json data
                example:{"status":"ok", "runnning":"0", "pendding":"0", "finished":"0", "node_name":"node_name"}
        """

        url, method = self.command_set["daemonstatus"]
        response = http_utils.request(url,
                                      method_type=method,
                                      return_type=http_utils.RETURN_JSON)
        return response
Exemple #8
0
 def delete_project_version(self, project_name, version):
     """
     Delete a project version
     if there are no more versions avaliabel for a given project.
     the project will be delted too.
     """
     url, method = self.command_set["delversion"]
     data = {"project": project_name, "version": version}
     response = http_utils.request(url,
                                   method_type=method,
                                   data=data,
                                   return_type=http_utils.RETURN_JSON)
     return response
Exemple #9
0
 def get_spider_list(self, project_name, version=None):
     """
     Get the list of spiders avalabel in the last version of some project
     """
     url, method = self.command_set["listspdiers"]
     data = {}
     data["project"] = project_name
     if version is not None:
         data["_version"] = version
     response = http_utils.request(url,
                                   method_type=method,
                                   data=data,
                                   return_type=http_utils.RETURN_JSON)
     return response
Exemple #10
0
 def cancel(self, project_name, job_id):
     """
     Cancel a spider run,if the job is pending it will be removed,
     if the job is running ,it will be terminated
     """
     url, method = self.command_set["cancel"]
     data = {}
     data["project"] = project_name
     data["job"] = job_id
     response = http_utils.request(url,
                                   method_type=method,
                                   data=data,
                                   return_type=http_utils.RETURN_JSON)
     return json.loads(response)
Exemple #11
0
 def add_version(self, project_name, version, egg):
     """
     Add a version to a project, creating the project if it doesn't exist
     """
     url, method = self.command_set["addversion"]
     data = {}
     data["project"] = project_name
     data["version"] = version
     data["egg"] = egg
     response = http_utils.request(url,
                                   method_type=method,
                                   data=data,
                                   return_type=http_utils.RETURN_JSON)
     return response