Skip to content

Commit 48f6fca

Browse files
committed
Integrate Diagon SDK for managed profiler
- include new SDK google-cloud-mldiagnostics
- add new config params
- modify profiler.py to add ML run and profiling
- modify metrics_logger.py to upload metrics
1 parent 58dba0a commit 48f6fca

File tree

9 files changed

+199
-92
lines changed

9 files changed

+199
-92
lines changed

base_requirements/requirements.txt

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,7 @@ flax
88
gcsfs
99
google-api-python-client
1010
google-cloud-aiplatform
11+
google-cloud-mldiagnostics
1112
google-cloud-monitoring
1213
grain[parquet]
1314
huggingface_hub

generated_requirements/cuda12-requirements.txt

Lines changed: 90 additions & 78 deletions
Original file line numberDiff line numberDiff line change
@@ -2,115 +2,121 @@
22
# If you need to modify dependencies, please do so in the host requirements file and run seed-env again.
33

44
absl-py>=2.3.1
5-
aiofiles>=24.1.0
5+
aiofiles>=25.1.0
66
aiohappyeyeballs>=2.6.1
7-
aiohttp>=3.13.0
7+
aiohttp>=3.13.1
88
aiosignal>=1.4.0
9+
annotated-doc>=0.0.3
910
annotated-types>=0.7.0
1011
antlr4-python3-runtime>=4.9.3
1112
anyio>=4.11.0
1213
aqtp>=0.9.0
1314
array-record>=0.8.1
14-
astroid>=3.3.11
15+
astroid>=4.0.1
1516
astunparse>=1.6.3
16-
attrs>=25.3.0
17-
auditwheel>=6.4.1
17+
attrs>=25.4.0
18+
auditwheel>=6.4.2
1819
black>=24.10.0
1920
blobfile>=3.1.0
20-
build>=1.2.2.post1
21-
cachetools>=6.2.0
21+
build>=1.3.0
22+
cachetools>=6.2.1
2223
certifi>=2025.10.5
23-
cffi>=2.0.0 ; platform_python_implementation == 'PyPy'
2424
cfgv>=3.4.0
25-
charset-normalizer>=3.4.3
26-
chex>=0.1.90
25+
charset-normalizer>=3.4.4
26+
cheroot>=11.0.0
27+
chex>=0.1.91
2728
click>=8.3.0
2829
cloud-accelerator-diagnostics>=0.1.1
2930
cloud-tpu-diagnostics>=0.1.5
3031
cloudpickle>=3.1.1
3132
clu>=0.0.12
3233
colorama>=0.4.6
33-
contourpy>=1.3.2
34-
coverage>=7.10.7
34+
contourpy>=1.3.3
35+
coverage>=7.11.0
3536
cycler>=0.12.1
36-
datasets>=4.2.0
37+
datasets>=4.3.0
3738
decorator>=5.2.1
3839
dill>=0.4.0
3940
distlib>=0.4.0
4041
dm-tree>=0.1.9
4142
docstring-parser>=0.17.0
4243
editdistance>=0.8.1
4344
einops>=0.8.1
45+
einshape>=1.0
4446
etils>=1.13.0
4547
evaluate>=0.4.6
4648
execnet>=2.1.1
47-
fastapi>=0.118.2
48-
filelock>=3.18.0
49-
flatbuffers>=25.2.10
50-
flax>=0.11.2
51-
fonttools>=4.59.0
49+
fastapi>=0.120.0
50+
filelock>=3.20.0
51+
flatbuffers>=25.9.23
52+
flax>=0.12.0
53+
fonttools>=4.60.1
5254
frozenlist>=1.8.0
53-
fsspec>=2025.7.0
55+
fsspec>=2025.9.0
5456
gast>=0.6.0
55-
gcsfs>=2025.7.0
56-
google-api-core>=2.26.0
57-
google-api-python-client>=2.184.0
57+
gcsfs>=2025.9.0
58+
google-api-core>=2.27.0
59+
google-api-python-client>=2.185.0
5860
google-auth-httplib2>=0.2.0
5961
google-auth-oauthlib>=1.2.2
6062
google-auth>=2.41.1
61-
google-cloud-aiplatform>=1.120.0
62-
google-cloud-appengine-logging>=1.6.2
63-
google-cloud-audit-log>=0.3.3
63+
google-benchmark>=1.9.4
64+
google-cloud-aiplatform>=1.122.0
65+
google-cloud-appengine-logging>=1.7.0
66+
google-cloud-audit-log>=0.4.0
6467
google-cloud-bigquery>=3.38.0
6568
google-cloud-core>=2.4.3
6669
google-cloud-logging>=3.12.1
67-
google-cloud-monitoring>=2.27.2
68-
google-cloud-resource-manager>=1.14.2
70+
google-cloud-mldiagnostics>=0.3.1
71+
google-cloud-monitoring>=2.28.0
72+
google-cloud-resource-manager>=1.15.0
6973
google-cloud-storage>=2.19.0
7074
google-crc32c>=1.7.1
71-
google-genai>=1.42.0
75+
google-genai>=1.46.0
7276
google-pasta>=0.2.0
7377
google-resumable-media>=2.7.2
74-
googleapis-common-protos>=1.70.0
75-
grain>=0.2.12
76-
grpc-google-iam-v1>=0.14.2
78+
googleapis-common-protos>=1.71.0
79+
grain>=0.2.13
80+
grpc-google-iam-v1>=0.14.3
7781
grpcio-status>=1.71.2
7882
grpcio>=1.75.1
7983
gviz-api>=1.10.0
8084
h11>=0.16.0
81-
h5py>=3.14.0
85+
h5py>=3.15.1
8286
hf-xet>=1.1.10 ; platform_machine == 'aarch64' or platform_machine == 'amd64' or platform_machine == 'arm64' or platform_machine == 'x86_64'
8387
httpcore>=1.0.9
8488
httplib2>=0.31.0
8589
httpx>=0.28.1
86-
huggingface-hub>=0.35.3
87-
humanize>=4.13.0
88-
hypothesis>=6.136.4
90+
huggingface-hub>=0.36.0
91+
humanize>=4.14.0
92+
hypothesis>=6.142.1
8993
identify>=2.6.15
90-
idna>=3.10
91-
immutabledict>=4.2.1
94+
idna>=3.11
95+
immutabledict>=4.2.2
9296
importlab>=0.8.1
9397
importlib-metadata>=8.7.0
9498
importlib-resources>=6.5.2
9599
iniconfig>=2.1.0
96-
isort>=6.1.0
97-
jax-cuda12-pjrt>=0.7.0, !=0.7.1, !=0.7.2 ; sys_platform == 'linux'
98-
jax-cuda12-plugin>=0.7.0, !=0.7.1, !=0.7.2 ; sys_platform == 'linux'
99-
jax>=0.7.0, !=0.7.1, !=0.7.2
100-
jaxlib>=0.7.0, !=0.7.1, !=0.7.2
100+
isort>=7.0.0
101+
jaraco-functools>=4.3.0
102+
jax-cuda12-pjrt>=0.8.0 ; sys_platform == 'linux'
103+
jax-cuda12-plugin>=0.8.0 ; sys_platform == 'linux'
104+
jax-triton>=0.3.0
105+
jax>=0.8.0
106+
jaxlib>=0.8.0
101107
jaxtyping>=0.3.3
102108
jinja2>=3.1.6
103109
joblib>=1.5.2
104110
jsonlines>=4.0.0
105111
keras>=3.11.3
106-
kiwisolver>=1.4.8
112+
kiwisolver>=1.4.9
107113
libclang>=18.1.1
108114
libcst>=1.8.5
109115
lxml>=6.0.2
110-
markdown-it-py>=3.0.0
116+
markdown-it-py>=4.0.0
111117
markdown>=3.9
112118
markupsafe>=3.0.3
113-
matplotlib>=3.10.3
119+
matplotlib>=3.10.7
114120
mccabe>=0.7.0
115121
mdurl>=0.1.2
116122
ml-collections>=1.1.0
@@ -129,32 +135,34 @@ networkx>=3.5
129135
ninja>=1.13.0
130136
nltk>=3.9.2
131137
nodeenv>=1.9.1
138+
numpy-typing-compat>=20250818.2.0
132139
numpy>=2.0.2
133-
nvidia-cublas-cu12>=12.9.1.4
134-
nvidia-cuda-cupti-cu12>=12.9.79
135-
nvidia-cuda-nvcc-cu12>=12.9.86
140+
nvidia-cublas-cu12>=12.9.1.4 ; sys_platform == 'linux'
141+
nvidia-cuda-cupti-cu12>=12.9.79 ; sys_platform == 'linux'
142+
nvidia-cuda-nvcc-cu12>=12.9.86 ; sys_platform == 'linux'
136143
nvidia-cuda-nvrtc-cu12>=12.9.86 ; sys_platform == 'linux'
137-
nvidia-cuda-runtime-cu12>=12.9.79
138-
nvidia-cudnn-cu12>=9.11.0.98
139-
nvidia-cufft-cu12>=11.4.1.4
140-
nvidia-cusolver-cu12>=11.7.5.82
141-
nvidia-cusparse-cu12>=12.5.10.65
142-
nvidia-nccl-cu12>=2.27.6
143-
nvidia-nvjitlink-cu12>=12.9.86
144-
nvidia-nvshmem-cu12>=3.3.9 ; sys_platform == 'linux'
144+
nvidia-cuda-runtime-cu12>=12.9.79 ; sys_platform == 'linux'
145+
nvidia-cudnn-cu12>=9.14.0.64 ; sys_platform == 'linux'
146+
nvidia-cufft-cu12>=11.4.1.4 ; sys_platform == 'linux'
147+
nvidia-cusolver-cu12>=11.7.5.82 ; sys_platform == 'linux'
148+
nvidia-cusparse-cu12>=12.5.10.65 ; sys_platform == 'linux'
149+
nvidia-nccl-cu12>=2.28.3 ; sys_platform == 'linux'
150+
nvidia-nvjitlink-cu12>=12.9.86 ; sys_platform == 'linux'
151+
nvidia-nvshmem-cu12>=3.4.5 ; sys_platform == 'linux'
145152
oauthlib>=3.3.1
146153
omegaconf>=2.3.0
147-
opentelemetry-api>=1.37.0
154+
opentelemetry-api>=1.38.0
148155
opt-einsum>=3.4.0
149156
optax>=0.2.6
150157
optree>=0.17.0
151-
orbax-checkpoint>=0.11.25
158+
optype>=0.14.0
159+
orbax-checkpoint>=0.11.26
152160
packaging>=25.0
153161
pandas>=2.3.3
154162
parameterized>=0.9.0
155163
pathspec>=0.12.1
156164
pathwaysutils>=0.1.3
157-
pillow>=11.3.0
165+
pillow>=12.0.0
158166
platformdirs>=4.5.0
159167
pluggy>=1.6.0
160168
portpicker>=1.6.0
@@ -164,37 +172,37 @@ promise>=2.3
164172
propcache>=0.4.1
165173
proto-plus>=1.26.1
166174
protobuf>=5.29.5
167-
psutil>=7.0.0
168-
pyarrow>=21.0.0
175+
psutil>=7.1.0
176+
pyarrow>=22.0.0
169177
pyasn1-modules>=0.4.2
170178
pyasn1>=0.6.1
171179
pycnite>=2024.7.31
172-
pycparser>=2.23 ; implementation_name != 'PyPy' and platform_python_implementation == 'PyPy'
173180
pycryptodomex>=3.23.0
174-
pydantic-core>=2.41.1
175-
pydantic>=2.12.0
181+
pydantic-core>=2.41.4
182+
pydantic>=2.12.3
176183
pydot>=4.0.1
177184
pyelftools>=0.32
178185
pyglove>=0.4.5
179186
pygments>=2.19.2
180187
pyink>=24.10.1
181-
pylint>=3.3.9
182-
pyparsing>=3.2.3
188+
pylint>=4.0.2
189+
pyparsing>=3.2.5
183190
pyproject-hooks>=1.2.0
184191
pytest-xdist>=3.8.0
185-
pytest>=8.4.1
192+
pytest>=8.4.2
186193
python-dateutil>=2.9.0.post0
187194
pytype>=2024.10.11
188195
pytz>=2025.2
189196
pyyaml>=6.0.3
190197
qwix>=0.1.1
191-
regex>=2025.9.18
198+
regex>=2025.10.23
192199
requests-oauthlib>=2.0.0
193200
requests>=2.32.5
194-
rich>=14.1.0
201+
rich>=14.2.0
195202
rsa>=4.9.1
196203
safetensors>=0.6.2
197-
scipy>=1.16.0
204+
scipy-stubs>=1.16.2.4
205+
scipy>=1.16.2
198206
sentencepiece>=0.2.1
199207
seqio>=0.0.20
200208
setuptools>=80.9.0
@@ -217,32 +225,36 @@ tensorflow-datasets>=4.9.9
217225
tensorflow-metadata>=1.17.2
218226
tensorflow-text>=2.19.0
219227
tensorflow>=2.19.1
220-
tensorstore>=0.1.76
228+
tensorstore>=0.1.78
221229
termcolor>=3.1.0
222230
tiktoken>=0.12.0
231+
tokamax>=0.0.4
223232
tokenizers>=0.22.1
224233
toml>=0.10.2
225234
tomlkit>=0.13.3
226-
toolz>=1.0.0
235+
toolz>=1.1.0
227236
tqdm>=4.67.1
228237
transformer-engine-cu12>=2.8.0
229238
transformer-engine-jax>=2.8.0
230239
transformer-engine>=2.8.0
231-
transformers>=4.57.0
240+
transformers>=4.57.1
232241
treescope>=0.1.10
233-
typing-extensions>=4.14.1
242+
triton>=3.5.0
243+
typeguard>=2.13.3
244+
typing-extensions>=4.15.0
234245
typing-inspection>=0.4.2
235246
tzdata>=2025.2
236247
uritemplate>=4.2.0
237248
urllib3>=2.5.0
238-
uvicorn>=0.37.0
239-
virtualenv>=20.34.0
249+
uvicorn>=0.38.0
250+
virtualenv>=20.35.3
240251
wadler-lindig>=0.1.7
241252
websockets>=15.0.1
242253
werkzeug>=3.1.3
243254
wheel>=0.45.1
244-
wrapt>=1.17.3
255+
wrapt>=2.0.0
256+
xprof>=2.20.7
245257
xxhash>=3.6.0
246258
yarl>=1.22.0
247259
zipp>=3.23.0
248-
zstandard>=0.23.0
260+
zstandard>=0.25.0

0 commit comments

Comments
 (0)