jacklangerman
/

my_cool_submission_2025

Model card Files Files and versions

xet

Community

jacklangerman committed on Apr 4

Commit

64fb003

verified ·

1 Parent(s): 5483b95

Upload folder using huggingface_hub

Browse files

Files changed (2) hide show

README.md +12 -2
script.py +43 -23

README.md CHANGED Viewed

@@ -1,4 +1,14 @@
-# My Cool Submission 2025
-This repo contains a submission to the [S23DR Challenge](https://huggingface.co/spaces/usm3d/S23DR) (part of the [USM3D](https://usm3d.github.io/) workshop at CVPR2025). It was prepared by [jacklangerman](https://huggingface.co/jacklangerman).

+# Empty solution example for the S23DR competition
+This repo provides a minimalistic example of a valid, but empty, submission to the S23DR competition.
+We recommend you take a look at [this example](https://huggingface.co/usm3d/handcrafted_baseline_submission),
+which implements some primitive algorithms and provides useful I/O and visualization functions.
+This example simply seeks to provide minimal code that succeeds at reading the dataset and producing a solution (in this case, two vertices at the origin and an edge of zero length connecting them).
+`script.py` is the main file, which is run by the competition space. It should produce `submission.parquet` as the result of the run. Please see the additional comments in the `script.py` file.
+---
+license: apache-2.0
+---

script.py CHANGED Viewed

@@ -44,46 +44,66 @@ if __name__ == "__main__":
     os.system('pwd')
     print(os.system('ls -lahtr'))
     print('/tmp/data/')
-    print(os.system('ls -lahtrR /tmp/data/'))
     data_path_test_server = Path('/tmp/data')
     data_path_local = Path().home() / '.cache/huggingface/datasets/usm3d___hoho25k_test_x/'
     if data_path_test_server.exists():
-        data_path = data_path_test_server
         TEST_ENV = True
     else:
-        data_path = data_path_local
         TEST_ENV = False
     print(data_path)
     # dataset = load_dataset(params['dataset'], trust_remote_code=True, use_auth_token=params['token'])
     data_files = {
-        "validation": [str(p) for p in [*data_path.rglob('*validation*.arrow')]+[*data_path.rglob('*public*/**/*.tar')]],
-        "test": [str(p) for p in [*data_path.rglob('*test*.arrow')]+[*data_path.rglob('*private*/**/*.tar')]],
     }
     print(data_files)
-    if TEST_ENV:
-        dataset = load_dataset(
-            "webdataset",
-            data_files=data_files,
-            trust_remote_code=True,
-            # streaming=True
-        )
-        print('load with webdataset')
-    else:
-        dataset = load_dataset(
-            "arrow",
-            data_files=data_files,
-            trust_remote_code=True,
-            # streaming=True
-        )
-        print('load with arrow')
     print(dataset, flush=True)

     os.system('pwd')
     print(os.system('ls -lahtr'))
     print('/tmp/data/')
+    print(os.system('ls -lahtr /tmp/data/'))
+    print('/tmp/data/data')
+    print(os.system('ls -lahtrR /tmp/data/data'))
     data_path_test_server = Path('/tmp/data')
     data_path_local = Path().home() / '.cache/huggingface/datasets/usm3d___hoho25k_test_x/'
     if data_path_test_server.exists():
+        # data_path = data_path_test_server
         TEST_ENV = True
     else:
+        # data_path = data_path_local
         TEST_ENV = False
+        from huggingface_hub import snapshot_download
+        _ = snapshot_download(
+            repo_id=params['dataset'],
+            local_dir="/tmp/data",
+            # token=params.token,
+            repo_type="dataset",
+        )
+    data_path = data_path_test_server
     print(data_path)
     # dataset = load_dataset(params['dataset'], trust_remote_code=True, use_auth_token=params['token'])
+    # data_files = {
+    #     "validation": [str(p) for p in [*data_path.rglob('*validation*.arrow')]+[*data_path.rglob('*public*/**/*.tar')]],
+    #     "test": [str(p) for p in [*data_path.rglob('*test*.arrow')]+[*data_path.rglob('*private*/**/*.tar')]],
+    # }
     data_files = {
+        "validation": [str(p) for p in data_path.rglob('*public*/**/*.tar')],
+        "test": [str(p) for p in data_path.rglob('*private*/**/*.tar')],
     }
     print(data_files)
+    dataset = load_dataset(
+        params['dataset'],
+        data_files=data_files,
+        trust_remote_code=True,
+        # streaming=True
+    )
+    # if TEST_ENV:
+    # dataset = load_dataset(
+    #     "webdataset",
+    #     data_files=data_files,
+    #     trust_remote_code=True,
+    #     # streaming=True
+    # )
+    print('load with webdataset')
+    # else:
+    #     dataset = load_dataset(
+    #         "arrow",
+    #         data_files=data_files,
+    #         trust_remote_code=True,
+    #         # streaming=True
+    #     )
+    #     print('load with arrow')
     print(dataset, flush=True)