Skip to content

Instantly share code, notes, and snippets.

@theSoberSobber
Created May 12, 2024 20:04
Show Gist options
  • Save theSoberSobber/ac721d0e97637bd08ffa7ac11d068d3f to your computer and use it in GitHub Desktop.
Save theSoberSobber/ac721d0e97637bd08ffa7ac11d068d3f to your computer and use it in GitHub Desktop.
Uploads a folder named test to drive with tag support, creates an index.json in the same directory, tags are to be supplied as meow,,cat,,animal,,pet.txt here meow.txt will be the name of the file and all others will be tags.
import os
from Google import Create_Service
from googleapiclient.http import MediaFileUpload
import hashlib
import json
API_NAME = 'drive'
API_VERSION = 'v3'
SCOPES = ['https://www.googleapis.com/auth/drive']
service = Create_Service("client_secret_akshat.json", API_NAME, API_VERSION, SCOPES)
print(service)
# file_path = 'test.txt'
# parent_folder_id = 'root'
# file_metadata = {
# 'name': os.path.basename(file_path),
# 'parents': [parent_folder_id]
# }
# media = MediaFileUpload(file_path)
# uploaded_file = service.files().create(
# body=file_metadata,
# media_body=media,
# fields='id, webViewLink'
# ).execute()
# print("File uploaded successfully.")
# print("File ID:", uploaded_file['id'])
# print("File link:", uploaded_file['webViewLink'])
def upload_internal(name, file_path):
file_metadata = {
'name': name,
'parents': ["root"]
}
media = MediaFileUpload(file_path)
uploaded_file = service.files().create(
body=file_metadata,
media_body=media,
fields='id, webViewLink'
).execute()
# print("File uploaded successfully.")
return uploaded_file['id'], uploaded_file['webViewLink']
def calculate_file_hash(file_path):
"""Calculate the SHA-256 hash of a file."""
sha256_hash = hashlib.sha256()
with open(file_path, "rb") as file:
# Read the file in chunks to avoid loading the entire file into memory
chunk = 0
while chunk := file.read(4096):
sha256_hash.update(chunk)
return sha256_hash.hexdigest()
def extract_tags(filename):
# Extract tags from filename
name, ext = os.path.splitext(filename)
tags = name.split(',,')[1:]
name = name.split(',,')[:1][0].split("\\")[-1]
# print(f"Tags extracted from filename {name}: {tags}")
return name + ext, tags
# print(extract_tags("test/meow,,kitten,,cat,,animal,,pet.txt"))
def upload(file_path):
# file_path = "test/meow,,kitten,,cat,,animal,,pet.txt"
name, tags = extract_tags(file_path)
_, link = upload_internal(name, file_path)
return name, link, tags
index = {}
directory = "test"
for root, dirs, files in os.walk(directory):
for file in files:
file_path = os.path.join(root, file)
if os.path.isfile(file_path):
name, link, tags = upload(file_path)
hash = calculate_file_hash(file_path)
index[hash] = {"name": name, "link": link, "tags": tags}
with open("index.json", 'w') as f:
json.dump(index, f, indent=4)
@theSoberSobber
Copy link
Author

theSoberSobber commented May 12, 2024

with hash and stop pickup

import os
from Google import Create_Service
from googleapiclient.http import MediaFileUpload
import hashlib
import json

API_NAME = 'drive'
API_VERSION = 'v3'
SCOPES = ['https://www.googleapis.com/auth/drive']

service = Create_Service("client_secret_akshat.json", API_NAME, API_VERSION, SCOPES)

print(service)

data = None

if os.path.exists('index.json'):
    with open('index.json', 'r') as file:
        data = json.load(file)

# file_path = 'test.txt'
# parent_folder_id = 'root'

# file_metadata = {
#     'name': os.path.basename(file_path),
#     'parents': [parent_folder_id]
# }

# media = MediaFileUpload(file_path)

# uploaded_file = service.files().create(
#     body=file_metadata,
#     media_body=media,
#     fields='id, webViewLink'
# ).execute()
# print("File uploaded successfully.")
# print("File ID:", uploaded_file['id'])
# print("File link:", uploaded_file['webViewLink'])

def upload_internal(name, file_path):
    file_metadata = {
        'name': name,
        'parents': ["root"]
    }
    media = MediaFileUpload(file_path)
    uploaded_file = service.files().create(
        body=file_metadata,
        media_body=media,
        fields='id, webViewLink'
    ).execute()
    # print("File uploaded successfully.")
    return uploaded_file['id'], uploaded_file['webViewLink']

def calculate_file_hash(file_path):
    """Calculate the SHA-256 hash of a file."""
    sha256_hash = hashlib.sha256()
    with open(file_path, "rb") as file:
        # Read the file in chunks to avoid loading the entire file into memory
        chunk = 0
        while chunk := file.read(4096):
            sha256_hash.update(chunk)
    return sha256_hash.hexdigest()

def extract_tags(filename):
    # Extract tags from filename
    name, ext = os.path.splitext(filename)
    tags = name.split(',,')[1:]
    name = name.split(',,')[:1][0].split("\\")[-1]
    # print(f"Tags extracted from filename {name}: {tags}")
    return name + ext, tags

# print(extract_tags("test/meow,,kitten,,cat,,animal,,pet.txt"))

def upload(file_path):
    # file_path = "test/meow,,kitten,,cat,,animal,,pet.txt"
    name, tags = extract_tags(file_path)
    hash = calculate_file_hash(file_path)
    if data and hash in data:
        return hash, data[hash]["name"], data[hash]["link"], data[hash]["tags"]
    _, link = upload_internal(name, file_path)
    return hash, name, link, tags

directory = "test"
for root, dirs, files in os.walk(directory):
    for file in files:
        file_path = os.path.join(root, file)
        if os.path.isfile(file_path):
            hash, name, link, tags = upload(file_path)
            if data and hash in data:
                print(f"File {name} already exists in index.json!")
                continue
            data[hash] = {"name": name, "link": link, "tags": tags}
            print(f"Uploaded {name} Successfully with tags: {tags}!")

with open("index.json", 'w') as f:
    json.dump(data, f, indent=4)
    ```

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment