Crunch-io · Alig1493 · Apr 4, 2024 · Apr 17, 2024 · Apr 24, 2024 · Apr 25, 2024
diff --git a/src/pycrunch/importing.py b/src/pycrunch/importing.py
@@ -52,6 +52,35 @@ def wait_for_batch_status(self, batch, status):
         else:
             raise ValueError("The batch did not reach the '%s' state in the "
                              "given time. Please check again later." % status)
+
+    def add_schema_metadata(self, site, schema, metadata, filename, fp, mimetype="application/x-parquet"):
+        """
+        Upload a file with its schema and metadata by POSTing to the sources catalog.
+
+        Parameters:
+        site (shoji.Catalog): a shoji Catalog object, from which we acquire session and sources url
+        schema (dict): schema object; serialized with json.dumps before being posted
+        metadata (dict): metadata object; serialized with json.dumps before being posted
+        filename (str): name of file being uploaded
+        fp (BufferedReader): opened file object
+        mimetype (str): mimetype of file being uploaded; defaults to "application/x-parquet"
+
+        Returns:
+        shoji.Entity: Shoji entity whose self url is the response's "Location" header
+        """
+        response = site.session.post(
+            site.catalogs.sources, 
+            files={
+                "uploaded_file": (filename, fp, mimetype)
+            },
+            data={
+                "schema": json.dumps(schema), 
+                "metadata": json.dumps(metadata),
+                "crunchlake": "create",
+                "dataset_id": "None"  # NOTE(review): the literal string "None", not None -- confirm intended
+            }
+        )
+        return shoji.Entity(self=response.headers.get("Location"), session=site.session)
 
     def add_source(self, ds, filename, fp, mimetype):
         """Create a new Source on the given dataset and return its URL."""