Example #1
0
	def __init__(self, config, db):
		self.config = config
		self.db = db
		self.lookup = LookupTables()
		self.legacy = Legacy(config)
		self.VIDEO_BOOK_SET = {"MAT","MRK","LUK","JHN"}
		self.VIDEO_BOOK_MAP = {"Mark": "MRK", "MRKZ": "MRK", "Luke": "LUK"}
Example #2
0
 def legacy_search_user_by_email(self, email):
     assert isinstance(email, (str, unicode)), email
     headers, data = self.__requester.requestAndCheck(
         "GET", "/legacy/user/email/" + email, None, None)
     return NamedUser.NamedUser(self.__requester,
                                Legacy.convertUser(data["user"]),
                                completed=False)
Example #3
0
 def legacy_search_user_by_email(self, email):
     """
     :calls: `GET /legacy/user/email/:email <http://developer.github.com/v3/search/legacy>`_
     :param email: string
     :rtype: :class:`github.NamedUser.NamedUser`
     """
     assert isinstance(email, (str, unicode)), email
     headers, data = self.__requester.requestJsonAndCheck("GET", "/legacy/user/email/" + email)
     return github.NamedUser.NamedUser(self.__requester, headers, Legacy.convertUser(data["user"]), completed=False)
Example #4
0
 def legacy_search_user_by_email( self, email ):
     assert isinstance( email, ( str, unicode ) ), email
     headers, data = self.__requester.requestAndCheck(
         "GET",
         "/legacy/user/email/" + email,
         None,
         None
     )
     return NamedUser.NamedUser( self.__requester, Legacy.convertUser( data[ "user" ] ), completed = False )
Example #5
0
 def legacy_search_users(self, keyword):
     assert isinstance(keyword, (str, unicode)), keyword
     return Legacy.PaginatedList(
         "/legacy/user/search/" + urllib.quote(keyword),
         {},
         self.__requester,
         "users",
         Legacy.convertUser,
         NamedUser.NamedUser,
     )
Example #6
0
 def legacy_search_issues(self, state, keyword):
     assert state in ["open", "closed"], state
     assert isinstance(keyword, (str, unicode)), keyword
     headers, data = self._requester.requestAndCheck(
         "GET", "/legacy/issues/search/" + self.owner.login + "/" +
         self.name + "/" + state + "/" + urllib.quote(keyword), None, None)
     return [
         Issue.Issue(self._requester,
                     Legacy.convertIssue(element),
                     completed=False) for element in data["issues"]
     ]
Example #7
0
 def legacy_search_issues(self, state, keyword):
     assert state in ["open", "closed"], state
     assert isinstance(keyword, (str, unicode)), keyword
     headers, data = self._requester.requestAndCheck(
         "GET",
         "/legacy/issues/search/" + self.owner.login + "/" + self.name + "/" + state + "/" + urllib.quote(keyword),
         None,
         None,
     )
     return [
         Issue.Issue(self._requester, Legacy.convertIssue(element), completed=False) for element in data["issues"]
     ]
Example #8
0
 def legacy_search_user_by_email(self, email):
     """
     :calls: `GET /legacy/user/email/:email <http://developer.github.com/v3/search/legacy>`_
     :param email: string
     :rtype: :class:`github.NamedUser.NamedUser`
     """
     assert isinstance(email, (str, unicode)), email
     headers, data = self.__requester.requestJsonAndCheck(
         "GET",
         "/legacy/user/email/" + email
     )
     return github.NamedUser.NamedUser(self.__requester, headers, Legacy.convertUser(data["user"]), completed=False)
Example #9
0
 def legacy_search_users(self, keyword):
     """
     :calls: `GET /legacy/user/search/:keyword <http://developer.github.com/v3/search/legacy>`_
     :param keyword: string
     :rtype: :class:`github.PaginatedList.PaginatedList` of :class:`github.NamedUser.NamedUser`
     """
     assert isinstance(keyword, (str, unicode)), keyword
     return Legacy.PaginatedList(
         "/legacy/user/search/" + urllib.quote_plus(keyword, safe='/%:><'),
         {},
         self.__requester,
         "users",
         Legacy.convertUser,
         github.NamedUser.NamedUser,
     )
Example #10
0
 def legacy_search_repos(self, keyword, language=GithubObject.NotSet):
     assert isinstance(keyword, (str, unicode)), keyword
     assert language is GithubObject.NotSet or isinstance(
         language, (str, unicode)), language
     args = {} if language is GithubObject.NotSet else {
         "language": language
     }
     return Legacy.PaginatedList(
         "/legacy/repos/search/" + urllib.quote(keyword),
         args,
         self.__requester,
         "repositories",
         Legacy.convertRepo,
         Repository.Repository,
     )
Example #11
0
 def legacy_search_repos(self, keyword, language=github.GithubObject.NotSet):
     """
     :calls: `GET /legacy/repos/search/:keyword <http://developer.github.com/v3/search/legacy>`_
     :param keyword: string
     :param language: string
     :rtype: :class:`github.PaginatedList.PaginatedList` of :class:`github.Repository.Repository`
     """
     assert isinstance(keyword, (str, unicode)), keyword
     assert language is github.GithubObject.NotSet or isinstance(language, (str, unicode)), language
     args = {} if language is github.GithubObject.NotSet else {"language": language}
     return Legacy.PaginatedList(
         "/legacy/repos/search/" + urllib.quote_plus(keyword, safe='/%:><'),
         args,
         self.__requester,
         "repositories",
         Legacy.convertRepo,
         github.Repository.Repository,
     )
Example #12
0
    def _extractLegacy(self):
        self.log.debug("parsing legacy U-Boot image in %s", self.path)
        p = Legacy.Parser(path=self.path, log=self.log)

        if p.ih_type != Legacy.Parser.IH_TYPE_MULTI:
            raise ValueError("not a multi-file image")

        if p.ih_os != Legacy.Parser.IH_OS_LINUX:
            raise ValueError("invalid OS code")

        sz, off = p.images[1]
        # assume the initrd is the second of three images

        with open(self.path) as fd:
            self.log.debug("reading initrd at [%x:%x]", off, off + sz)
            fd.seek(off, 0)
            buf = fd.read(sz)

        fno, self.initrd = tempfile.mkstemp(prefix="initrd-", suffix=".img")
        self.log.debug("+ cat > %s", self.initrd)
        with os.fdopen(fno, "w") as fd:
            fd.write(buf)
Example #13
0
import Legacy

Legacy.runlegacyapp("Files-legacy.py")
Example #14
0
import Legacy

Legacy.runlegacyapp("Grapher-legacy.py")
Example #15
0
class BucketVerseSummaryTable:
    def __init__(self, config, db):
        self.config = config
        self.legacy = Legacy(config)
        self.db = db

    def process(self):
        self.createSummaryTable()
        self.insertBucketSummary()
        self.insertVerseSummary()
        self.createIndexes()

    ## The pkey assumes that a fileset can have multiple bibles.
    def createSummaryTable(self):
        self.db.execute("DROP TABLE IF EXISTS bucket_verse_summary", None)
        sql = ("CREATE TABLE bucket_verse_summary (" +
               " fileset_id varchar(255) not null," +
               " asset_id varchar(255) not null," +
               " set_type_code varchar(255) not null," +
               " bible_id varchar(255) not null," +
               " legacy_asset_id varchar(255) not null," +
               " hash_id varchar(255) not null," +
               " PRIMARY KEY (fileset_id, asset_id, set_type_code, bible_id))")
        self.db.execute(sql, None)
        print("bucket_verse_summary created")

    def insertBucketSummary(self):
        sql = (
            "INSERT INTO bucket_verse_summary" +
            " SELECT distinct fileset_id, asset_id, set_type_code, bible_id, legacy_asset_id, hash_id"
            + " FROM bucket_listing")
        self.db.execute(sql, None)
        print("bucket rows inserted")

    def insertVerseSummary(self):
        results = []
        verses = VersesReader(self.config)
        bibleFilesets = verses.bibleIdFilesetId()
        for bibleFileset in bibleFilesets:
            parts = bibleFileset.split("/")
            bibleId = parts[0]
            filesetId = parts[1]
            setTypeCode = "text_plain"
            assetId = "db"
            legacyAssetId = self.legacy.legacyAssetId(filesetId, setTypeCode,
                                                      assetId)
            hashId = self.legacy.hashId(legacyAssetId, filesetId, setTypeCode)
            results.append((filesetId, assetId, setTypeCode, bibleId,
                            legacyAssetId, hashId))
        self.db.executeBatch(
            "INSERT INTO bucket_verse_summary (fileset_id, asset_id, set_type_code, bible_id, legacy_asset_id, hash_id) VALUES (%s, %s, %s, %s, %s, %s)",
            results)
        print("num %d verse rows inserted" % (len(results)))

    def createIndexes(self):
        ## This is redundant of primary key, if that is kept in
        self.db.execute(
            "CREATE INDEX bucket_verse_summary_bible_id ON bucket_verse_summary (bible_id)",
            None)
        ## If multiple bibles per fileset should not be allowed, then this can be unique
        self.db.execute(
            "CREATE INDEX bucket_verse_summary_bible_hash_id ON bucket_verse_summary (hash_id)",
            None)
        print("indexes created")
Example #16
0
class BucketListingTable:

	def __init__(self, config, db):
		self.config = config
		self.db = db
		self.lookup = LookupTables()
		self.legacy = Legacy(config)
		self.VIDEO_BOOK_SET = {"MAT","MRK","LUK","JHN"}
		self.VIDEO_BOOK_MAP = {"Mark": "MRK", "MRKZ": "MRK", "Luke": "LUK"}


	def process(self):
		self.createBucketTable()
		self.insertBucketList("dbp-prod")
		self.insertBucketList("dbp-vid")
		self.createIndexes()


	def createBucketTable(self):
		self.db.execute("DROP TABLE IF EXISTS bucket_listing", None)
		sql = ("CREATE TABLE bucket_listing ("
			+ " asset_id varchar(255) not null,"
			+ " type_code varchar(255) not null,"
			+ " bible_id varchar(255) not null,"
			+ " fileset_id varchar(255) not null,"
			+ " file_name varchar(255) not null,"
			+ " set_type_code varchar(255) not null,"
			+ " legacy_asset_id varchar(255) not null,"
			+ " hash_id varchar(255) not null,"
			+ " book_id char(3) NULL,"
			+ " chapter_start varchar(255) NULL,"
			+ " verse_start varchar(255) NULL,"
			+ " verse_end varchar(255) NULL)")
		self.db.execute(sql, None)


	def insertBucketList(self, bucketName):
		results = []
		dropTypes = set()
		dropBibleIds = set()
		dropAudioIds = set()
		dropTextIds = set()
		dropVideoIds = set()
		bucketPath = self.config.directory_bucket_list % (bucketName.replace("-", "_"))
		files = io.open(bucketPath, mode="r", encoding="utf-8")
		for line in files:
			if "delete" not in line:
				parts = line.strip().split("/")
				if len(parts) == 4:
					typeCode = parts[0]
					bibleId = parts[1]
					filesetId = parts[2]
					fileName = parts[3]
					fileNameSansExt = fileName.split(".")[0]
					row = (bucketName, typeCode, bibleId, filesetId, fileName)
					if bibleId.isupper():
						if typeCode == "audio":
							if fileName.endswith(".mp3"):
								if filesetId.isupper():
									setTypeCode = self.setTypeCode(filesetId)
									legacyAssetId = self.legacy.legacyAssetId(filesetId, setTypeCode, bucketName)
									hashId = self.legacy.hashId(legacyAssetId, filesetId, setTypeCode)
									extra = (setTypeCode, legacyAssetId, hashId)
									fileParts = self.parseAudioFilename(fileNameSansExt)
									results.append(row + extra + fileParts)
								else:
									dropAudioIds.add("audio/%s/%s" % (bibleId, filesetId))
						elif typeCode == "text":
							if fileName.endswith(".html"):
								if filesetId.isupper():
									if fileNameSansExt not in {"index", "about"}:
										setTypeCode = "text_format"
										legacyAssetId = self.legacy.legacyAssetId(filesetId, setTypeCode, bucketName)
										hashId = self.legacy.hashId(legacyAssetId, filesetId, setTypeCode)
										extra = (setTypeCode, legacyAssetId, hashId)
										fileParts = self.parseTextFilenames(fileNameSansExt)
										results.append(row + extra + fileParts)
								else:
									dropTextIds.add("text/%s/%s" % (bibleId, filesetId))
						elif typeCode == "video":
							if (fileName.endswith(".mp4") and not fileName.endswith("web.mp4") 
								and not filesetId.endswith("480") and not filesetId.endswith("720")):
								if filesetId.isupper():
									setTypeCode = "video_stream"
									legacyAssetId = self.legacy.legacyAssetId(filesetId, setTypeCode, bucketName)
									hashId = self.legacy.hashId(legacyAssetId, filesetId, setTypeCode)
									extra = (setTypeCode, legacyAssetId, hashId)
									fileParts = self.parseVideoFilenames(fileNameSansExt)
									results.append(row + extra + fileParts)
								else:
									dropVideoIds.add("video/%s/%s" % (bibleId, filesetId))
						else:
							dropTypes.add(typeCode)
					else:
						dropBibleIds.add("%s/%s" % (typeCode, bibleId))
		warningPathName = "output/BucketListing_%s.text" % (bucketName)
		output = io.open(warningPathName, mode="w", encoding="utf-8")
		self.privateDrop(output, "WARNING: type_code %s was excluded", dropTypes)
		self.privateDrop(output, "WARNING: bible_id %s was excluded", dropBibleIds)
		self.privateDrop(output, "WARNING: audio_id %s was excluded", dropAudioIds)
		self.privateDrop(output, "WARNING: text_id %s was excluded", dropTextIds)
		self.privateDrop(output, "WARNING: video_id %s was excluded", dropVideoIds)
		output.close()
		print("%d rows to insert" % (len(results)))
		self.db.executeBatch("INSERT INTO bucket_listing VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s)", results)


	def createIndexes(self):
		self.db.execute("CREATE INDEX bucket_listing_bible_id ON bucket_listing (bible_id)", None)
		self.db.execute("CREATE INDEX bucket_listing_fileset_id ON bucket_listing (fileset_id, asset_id, set_type_code)", None)
		self.db.execute("CREATE INDEX bucket_listing_hash_id ON bucket_listing (hash_id, book_id, chapter_start, verse_start)", None)
		self.db.execute("CREATE INDEX bucket_listing_prefix ON bucket_listing (type_code, bible_id, fileset_id)", None)


	def privateDrop(self, output, message, dropIds):
		print("num %d:  %s" % (len(dropIds), message))
		message += "\n"
		sortedIds = sorted(list(dropIds))
		for dropId in sortedIds:
			output.write(message % (dropId))


	def setTypeCode(self, filesetId):
		code = filesetId[7:9]
		if code == "1D":
			return "audio"
		elif code == "2D":
			return "audio_drama"
		else:
			code = filesetId[8:10]
			if code == "1D":
				return "audio"
			elif code == "2D":
				return "audio_drama"
			elif filesetId == "N1TUVDPI":
				return "audio"
			elif filesetId == "O1TUVDPI":
				return "audio"
			else:
				print("WARNING: file type not known for %s, set_type_code set to 'unknown'" % (filesetId))
				return "unknown"


	def parseAudioFilename(self, fileName):
		seqCode = fileName[0:3]
		bookCode = self.lookup.bookIdBySequence(seqCode)
		if bookCode == None:
			chapterStart = "1"
		else:
			chapterStart = fileName[5:8].strip("_")
			if not chapterStart.isdigit():
				bookCode = None
				chapterStart = "1"
		verseStart = "1"
		verseEnd = None
		return (bookCode, chapterStart, verseStart, verseEnd)


	def parseTextFilenames(self, fileName):
		#{fileset}_{seq}_{USFM3}_{chapter}.html (chapter optional)
		#{USFM2}{chapter}.html (chapter optional)
		parts = fileName.split("_")
		if len(parts) > 2:
			bookCode = parts[2]
			chapterStart = parts[3] if len(parts) > 3 else "0"
		else:
			bookCode = self.lookup.bookIdBy2Char(fileName[:2])
			if bookCode == None:
				chapterStart = "1"
			else:
				chapterStart = fileName[2:].strip("_")
				if chapterStart == "":
					chapterStart = "0"
		verseStart = "1"
		verseEnd = None
		return (bookCode, chapterStart, verseStart, verseEnd)


	def parseVideoFilenames(self, fileName):
		parts = re.split("[_-]", fileName)
		seqCode = fileName[0:3]
		bookCode = self.lookup.bookIdBySequence(seqCode)
		if bookCode != None:
			chapterStart = fileName[5:8].strip("_")
			verseStart = "1"
			verseEnd = None
		else:
			chapterStart = "1"
			verseStart = "1"
			verseEnd = None
			for index in range(len(parts)):
				part = parts[index]
				if len(part) == 3 and part in self.VIDEO_BOOK_SET:
					bookCode = part
				elif len(part) == 4 and part in self.VIDEO_BOOK_MAP.keys():
					bookCode = self.VIDEO_BOOK_MAP[part]
				if bookCode != None:
					chapterStart = parts[index + 1]
					if chapterStart.isdigit():
						verseStart = parts[index + 2] if len(parts) > (index + 2) else "1"
						verseEnd = parts[index + 3] if len(parts) > (index + 3) else None
					break
		return (bookCode, chapterStart, verseStart, verseEnd)
Example #17
0
 def __init__(self, config, db):
     self.config = config
     self.legacy = Legacy(config)
     self.db = db