Загрузка Google Sheets во фрейм данных Pandas

Я ищу код, который поможет мне автоматически распечатать Excel на листе Google с помощью Python.

Я пробовал несколько вариантов кода, но безуспешно.


from __future__ import print_function
import pickle
import os.path
from googleapiclient.discovery import build
from google_auth_oauthlib.flow import InstalledAppFlow
from google.auth.transport.requests import Request



# If modifying these scopes, delete the file token.pickle.
# The scope must be a real Google OAuth scope URL; this one grants read-only
# access to Google Sheets.
SCOPES = ['https://www.googleapis.com/auth/spreadsheets.readonly']

# The ID and range of a sample spreadsheet.
SAMPLE_SPREADSHEET_ID = '1NXenqaum6PHsDBXyv-_tGKIL-z4tSaCsZpUT9Q5wpkY'
SAMPLE_RANGE_NAME = 'Sheet1!A1:L'

def main():
    """Print every row of the sample spreadsheet range.

    Loads cached OAuth credentials from ``token.pickle`` when that file
    exists, refreshes them or runs the local-server login flow when they are
    missing or invalid, and saves the resulting credentials back to
    ``token.pickle``. It then reads ``SAMPLE_RANGE_NAME`` from
    ``SAMPLE_SPREADSHEET_ID`` and prints each row as twelve comma-separated
    values (columns A through L), or ``No data found.`` when the range is
    empty.
    """
    creds = None
    # The file token.pickle stores the user's access and refresh tokens, and is
    # created automatically when the authorization flow completes for the first
    # time.
    # NOTE: unpickling can execute arbitrary code, so only load a token file
    # that this script wrote itself.
    if os.path.exists('token.pickle'):
        with open('token.pickle', 'rb') as token:
            creds = pickle.load(token)
    # If there are no (valid) credentials available, let the user log in.
    if not creds or not creds.valid:
        if creds and creds.expired and creds.refresh_token:
            creds.refresh(Request())
        else:
            flow = InstalledAppFlow.from_client_secrets_file(
                'credentials.json', SCOPES)
            creds = flow.run_local_server()
        # Save the credentials for the next run
        with open('token.pickle', 'wb') as token:
            pickle.dump(creds, token)

    service = build('sheets', 'v4', credentials=creds)

    # Call the Sheets API
    sheet = service.spreadsheets()
    result = sheet.values().get(spreadsheetId=SAMPLE_SPREADSHEET_ID,
                                range=SAMPLE_RANGE_NAME).execute()
    values = result.get('values', [])

    if not values:
        print('No data found.')
        return

    # Columns A through L of the requested range.
    column_count = 12
    for row in values:
        # The Sheets API omits trailing empty cells, so a row may hold fewer
        # than twelve values; pad it with empty strings instead of indexing
        # past its end.
        cells = list(row[:column_count])
        cells += [''] * (column_count - len(cells))
        print(', '.join(str(cell) for cell in cells))

# Run the demo only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()

Хотя я могу вывести содержимое листа Google на экран, я не могу сохранить его во фрейме данных, чтобы позже записать его в книгу Excel.


person Siddhant Mehandru    schedule 21.05.2019    source источник


Ответы (2)


Вот как я добился рабочей загрузки Google Sheets во фрейм данных Pandas с помощью страницы быстрого старта Google для Python и статьи, которую я нашёл на Medium и адаптировал под свои нужды.

# This works in Python 3.6+
from googleapiclient.discovery import build
from google_auth_oauthlib.flow import InstalledAppFlow
from google.auth.transport.requests import Request
import os.path
import pickle
import pandas as pd


# Read-only access to Google Sheets.
SCOPES = ["https://www.googleapis.com/auth/spreadsheets.readonly"]
# Placeholders: replace these with your spreadsheet's ID and an A1-notation
# range before running. They are quoted so the module imports cleanly even
# before they are filled in.
SPREADSHEET_ID = "YOUR_ID_GOES_HERE"
RANGE_NAME = "YOUR_RANGE_GOES_HERE"


def get_google_sheet(spreadsheet_id, range_name):
    """Fetch a range of a Google sheet through the Sheets v4 API.

    Credentials are read from ``token.pickle`` when that file exists. If they
    are missing or not valid they are either refreshed or obtained through
    the local-server OAuth flow based on ``credentials.json``, and then
    written back to ``token.pickle``.

    Args:
        spreadsheet_id: ID of the spreadsheet to read.
        range_name: Range to read, passed to the API as ``range``.

    Returns:
        The result of executing the ``spreadsheets().values().get`` request.
    """
    token_path = "token.pickle"

    # Reuse the tokens cached by an earlier run, if any.
    credentials = None
    if os.path.exists(token_path):
        with open(token_path, "rb") as token_file:
            credentials = pickle.load(token_file)

    if not (credentials and credentials.valid):
        refreshable = (
            credentials and credentials.expired and credentials.refresh_token
        )
        if refreshable:
            credentials.refresh(Request())
        else:
            # No usable credentials: send the user through the login flow.
            credentials = InstalledAppFlow.from_client_secrets_file(
                "credentials.json", SCOPES
            ).run_local_server()
        # Cache the credentials so the next run can skip the login.
        with open(token_path, "wb") as token_file:
            pickle.dump(credentials, token_file)

    values_api = build("sheets", "v4", credentials=credentials).spreadsheets().values()
    request = values_api.get(spreadsheetId=spreadsheet_id, range=range_name)
    return request.execute()


def to_dataframe(gsheet):
    """Convert a Sheets API ``values.get`` response to a pandas DataFrame.

    The first row of ``gsheet["values"]`` is used as the column header and
    the remaining rows become the data.

    The Sheets API leaves trailing empty cells out of each row, so data rows
    can be shorter than the header row. Such rows are padded with ``None``
    so that every row matches the header width. A row longer than the header
    is passed through unchanged and pandas rejects it, as before.

    Args:
        gsheet: Mapping returned by the API; its ``"values"`` entry is a list
            of rows, each row a list of cell values.

    Returns:
        A DataFrame with one column per header cell. An empty DataFrame is
        returned when the response has no ``"values"`` entry or it is empty.
    """
    values = gsheet.get("values") or []
    if not values:
        # An empty range comes back without a "values" key at all.
        return pd.DataFrame()

    header, *rows = values
    width = len(header)
    # A negative pad count yields an empty list, leaving long rows untouched.
    padded_rows = [list(row) + [None] * (width - len(row)) for row in rows]
    return pd.DataFrame(padded_rows, columns=header)
person lalligood    schedule 28.05.2019

Попробуйте следующий код

  1. Перейдите в консоль Google и создайте проект.

  2. Включите сервисы, создайте учетные данные и загрузите файл json.

  3. Возьмите client_email и откройте доступ к своему листу Google для этого адреса электронной почты.

  4. попробуйте следующий код

import gspread
import pandas as pd

from oauth2client.service_account import ServiceAccountCredentials

# Scopes requested for the service account.
scope = [
    "https://spreadsheets.google.com/feeds",
    'https://www.googleapis.com/auth/spreadsheets',
    "https://www.googleapis.com/auth/drive.file",
    "https://www.googleapis.com/auth/drive",
]
creds = ServiceAccountCredentials.from_json_keyfile_name("YOUR_JSON_FILE_NAME.json", scope)

client = gspread.authorize(creds)

sheet = client.open("GOOGLE_SHEET_NAME").sheet1  # Open the first worksheet of the spreadsheet
# get_all_records() already treats the first sheet row as the header and
# returns one dict per remaining row, so every record is real data. Popping
# the first record to use as "headers" would silently drop a row.
data = sheet.get_all_records()

# Column names come from the keys of the record dicts.
df = pd.DataFrame(data)
print(df.head())

Для справки по консоли Google перейдите по следующей ссылке https://medium.com/@vince.shields913/reading-google-sheets-into-a-pandas-dataframe-with-gspread-and-oauth2-375b932be7bf

person Community    schedule 16.06.2021