#@title
# Examples of loading datasets that are not hosted on the Hugging Face Hub
# with `datasets.load_dataset`: a local CSV, a remote CSV, a plain-text file,
# a JSON Lines file, and nested JSON files mapped to named splits.
#
# The notebook shell magics (`!pip`, `!wget`) are written as plain Python so
# that this file is valid Python and runs top to bottom as a script as well
# as inside a notebook cell. Results are printed explicitly because a bare
# expression is only displayed when it is the last statement of a cell.
import subprocess
import sys
import urllib.request
from pathlib import Path

try:
    from IPython.display import HTML
except ImportError:
    # IPython is only needed for the (empty) title widget below, so a
    # standalone run without it can safely continue.
    HTML = None

if HTML is not None:
    # The title cell's embedded markup is empty; kept as in the notebook.
    HTML('')

# Equivalent of `!pip install datasets transformers[sentencepiece]`.
# `sys.executable -m pip` targets the interpreter that is running this file.
# check=False mirrors the shell magic, which does not abort on a failed
# install (the packages may already be present).
subprocess.run(
    [
        sys.executable,
        "-m",
        "pip",
        "install",
        "datasets",
        "transformers[sentencepiece]",
    ],
    check=False,
)

# Equivalent of `!wget <url>`: fetch the CSV into the working directory.
# An existing copy is reused instead of being downloaded again.
local_csv_path = Path("winequality-white.csv")
if not local_csv_path.exists():
    urllib.request.urlretrieve(
        "https://archive.ics.uci.edu/ml/machine-learning-databases/wine-quality/winequality-white.csv",
        str(local_csv_path),
    )

# Imported after the install step above so a fresh environment works.
from datasets import load_dataset

# --- Local CSV file (semicolon-separated) ---------------------------------
local_csv_dataset = load_dataset("csv", data_files="winequality-white.csv", sep=";")
print(local_csv_dataset["train"])

# --- Remote CSV: load the dataset from the URL directly -------------------
dataset_url = "https://archive.ics.uci.edu/ml/machine-learning-databases/wine-quality/winequality-white.csv"
remote_csv_dataset = load_dataset("csv", data_files=dataset_url, sep=";")
print(remote_csv_dataset)

# --- Remote plain-text file -----------------------------------------------
dataset_url = "https://raw.githubusercontent.com/karpathy/char-rnn/master/data/tinyshakespeare/input.txt"
text_dataset = load_dataset("text", data_files=dataset_url)
print(text_dataset["train"][:5])

# --- Remote JSON Lines file -----------------------------------------------
dataset_url = "https://raw.githubusercontent.com/hirupert/sede/main/data/sede/train.jsonl"
json_lines_dataset = load_dataset("json", data_files=dataset_url)
print(json_lines_dataset["train"][:2])

# --- Remote nested JSON: the records live under the top-level "data" key --
dataset_url = "https://rajpurkar.github.io/SQuAD-explorer/dataset/train-v2.0.json"
json_dataset = load_dataset("json", data_files=dataset_url, field="data")
print(json_dataset)

# --- Several remote JSON files mapped to named splits ---------------------
url = "https://rajpurkar.github.io/SQuAD-explorer/dataset/"
data_files = {"train": f"{url}train-v2.0.json", "validation": f"{url}dev-v2.0.json"}
json_dataset = load_dataset("json", data_files=data_files, field="data")
print(json_dataset)