#!/usr/bin/env python
# coding: utf-8
"""Fetch the Cricsheet ODI match archive and load its JSON files.

Run as a script, this module:

1. downloads ``odis_json.zip`` once,
2. extracts it into ``DATA_DIR``,
3. stores every extracted ``*.json`` document in the SQLite database
   ``DATABASE_PATH`` (one row per file), and
4. prints the type and top-level keys of one match for a quick look.
"""

import csv
import glob
import json
import os
import pprint
import sqlite3
import warnings
import zipfile
from io import BytesIO
from typing import Iterable, Iterator, List, Optional, Tuple
from urllib.request import urlopen
from zipfile import ZipFile

import cricketstats
import numpy as np
import pandas as pd
import requests
from pandas.core.frame import DataFrame

# Kept from the notebook: silences every warning for the whole process.
warnings.filterwarnings("ignore")

ODI_ARCHIVE_URL = "https://cricsheet.org/downloads/odis_json.zip"
DATA_DIR = "odis"
DATABASE_PATH = "cricketDB.db"
DOWNLOAD_TIMEOUT = 60  # seconds; without it a stalled connection hangs forever


def download_archive(
    url: str = ODI_ARCHIVE_URL, timeout: float = DOWNLOAD_TIMEOUT
) -> ZipFile:
    """Download *url* and return its body as an open, in-memory ``ZipFile``.

    Raises:
        requests.HTTPError: if the server answers with an error status.
        zipfile.BadZipFile: if the response body is not a zip archive.
    """
    response = requests.get(url, timeout=timeout)
    # Fail here rather than later with a confusing BadZipFile on an error page.
    response.raise_for_status()
    return ZipFile(BytesIO(response.content))


def extract_archive(archive: ZipFile, destination: str = DATA_DIR) -> str:
    """Extract every member of *archive* into *destination* and return it.

    The directory is created when it does not exist yet.
    """
    os.makedirs(destination, exist_ok=True)
    archive.extractall(path=destination)
    return destination


def list_match_files(directory: str = DATA_DIR) -> List[str]:
    """Return the sorted paths of all ``*.json`` files in *directory*."""
    return sorted(glob.glob(os.path.join(directory, "*.json")))


def load_match(path: str) -> dict:
    """Parse the JSON document stored at *path*."""
    with open(path, encoding="utf-8") as handle:
        return json.load(handle)


def iter_matches(directory: str = DATA_DIR) -> Iterator[Tuple[str, dict]]:
    """Yield ``(filename, parsed document)`` for each JSON file in *directory*.

    Documents are yielded one at a time so the whole archive never has to be
    held in memory at once.
    """
    for path in list_match_files(directory):
        yield os.path.basename(path), load_match(path)


def store_matches(
    matches: Iterable[Tuple[str, dict]], database: str = DATABASE_PATH
) -> int:
    """Write *matches* to the ``matches`` table of *database*.

    Each ``(filename, document)`` pair becomes one row holding the file name
    and the document serialized as JSON text.  Rows are keyed by file name
    and replaced on conflict, so re-running the script does not duplicate
    data.

    Returns:
        The number of documents written.
    """
    stored = 0
    connection = sqlite3.connect(database)
    try:
        # The connection context manager commits on success and rolls back
        # on error; it does not close the connection, hence the try/finally.
        with connection:
            connection.execute(
                "CREATE TABLE IF NOT EXISTS matches ("
                "filename TEXT PRIMARY KEY, data TEXT NOT NULL)"
            )
            for filename, match in matches:
                connection.execute(
                    "INSERT OR REPLACE INTO matches (filename, data) "
                    "VALUES (?, ?)",
                    (filename, json.dumps(match, ensure_ascii=False)),
                )
                stored += 1
    finally:
        connection.close()
    return stored


def print_file_contents(directory: Optional[str] = None) -> None:
    """Print the raw bytes of every regular file in *directory*.

    Debugging aid; defaults to the current working directory.  It is not
    called by ``main`` because the output is very large.
    """
    if directory is None:
        directory = os.getcwd()
    for entry in sorted(os.listdir(directory)):
        path = os.path.join(directory, entry)
        # open() raises IsADirectoryError on sub-directories, so skip them.
        if not os.path.isfile(path):
            continue
        with open(path, "rb") as handle:
            print(handle.read())


def main() -> None:
    """Download, extract, store and briefly inspect the ODI match files."""
    with download_archive() as archive:
        extract_archive(archive, DATA_DIR)

    stored = store_matches(iter_matches(DATA_DIR), DATABASE_PATH)
    print(f"Stored {stored} match files in {DATABASE_PATH}")

    paths = list_match_files(DATA_DIR)
    if not paths:
        print(f"No JSON files found in {DATA_DIR!r}")
        return

    # Show the structure of one document as a quick sanity check.
    sample = load_match(paths[-1])
    print(type(sample))
    pprint.pprint(list(sample.keys()))


if __name__ == "__main__":
    main()