update kernel dataset to exclude the disktensor ones (#3651)

Disk tensor loads contain large offsets and are not meant to be run on the GPU.

Repro steps:
```
time ./extra/optimization/generate_dataset.sh
gzip /tmp/sops
mv /tmp/sops.gz extra/datasets/
```
This commit is contained in:
chenyu
2024-03-07 17:35:19 -05:00
committed by GitHub
parent fcf4a5ccf2
commit a66ffec6d3
3 changed files with 4 additions and 4 deletions

Binary file not shown.

View File

@@ -12,9 +12,9 @@ WINO=1 STEPS=3 python3 examples/hlb_cifar10.py
python3 examples/stable_diffusion.py --noshow
python3 examples/llama.py --prompt "hello" --count 5
python3 examples/gpt2.py --count 5
python3 HALF=1 examples/gpt2.py --count 5
python3 python examples/beautiful_mnist.py
python3 python examples/beautiful_cartpole.py
HALF=1 python3 examples/gpt2.py --count 5
python3 examples/beautiful_mnist.py
python3 examples/beautiful_cartpole.py
python3 examples/mlperf/model_spec.py
python3 examples/yolov8.py ./test/models/efficientnet/Chicken.jpg
openpilot/go.sh

View File

@@ -50,7 +50,7 @@ logops = open(getenv("LOGOPS", ""), "a") if getenv("LOGOPS", "") else None
def run_schedule(schedule:List[ScheduleItem]):
while len(schedule):
si = schedule.pop(0)
if logops and si.ast.op not in LoadOps: logops.write(str(si.ast)+"\n")
if logops and si.ast.op not in LoadOps and not any(i.device.startswith("DISK:") for i in si.inputs): logops.write(str(si.ast)+"\n")
# get the program
prg = lower_schedule_item(si)