diff --git a/datasets/mnist/README.md b/datasets/mnist/README.md new file mode 100644 index 00000000000..9a05178b13d --- /dev/null +++ b/datasets/mnist/README.md @@ -0,0 +1,146 @@ +--- +annotations_creators: +- experts +language_creators: +- found +languages: [] +licenses: +- MIT +multilinguality: [] +size_categories: +- 10KI", f.read(4))[0] + _ = f.read(8) + images = np.frombuffer(f.read(), dtype=np.uint8).reshape(size, 28, 28) + + # Labels + with open(filepath[1], "rb") as f: + # First 8 bytes contain some metadata + _ = f.read(8) + labels = np.frombuffer(f.read(), dtype=np.uint8) + + for idx in range(size): + yield idx, {"image": images[idx], "label": str(labels[idx])}