Skip to content

Commit

Permalink
Add log information for gpu collector (microsoft#3506)
Browse files Browse the repository at this point in the history
  • Loading branch information
SparkSnail authored and Hao Ni committed Apr 7, 2021
1 parent aa42ddd commit 876a366
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 2 deletions.
3 changes: 2 additions & 1 deletion ts/nni_manager/training_service/common/gpuData.ts
Original file line number Diff line number Diff line change
Expand Up @@ -79,6 +79,7 @@ export function parseGpuIndices(gpuIndices?: string): Set<number> | undefined {
/**
 * PowerShell script template that launches the GPU metrics collector on Windows.
 *
 * Placeholders (substituted by the caller before the script is run):
 *   - `{0}`: directory exported as `METRIC_OUTPUT_DIR`; the collector's
 *            `stdout` and `stderr` files are also written into it.
 *   - `{1}`: file that receives the ID of the started collector process.
 *
 * The trailing backslash on the `Start-Process` line is a JavaScript template
 * literal line continuation, so PowerShell receives the command and its
 * redirect options as one single line. The collector is started exactly once.
 *
 * NOTE(review): `{0}` and `{1}` are not quoted in the redirect / `Out-File`
 * arguments; paths containing spaces may need quoting - confirm against callers.
 */
export const GPU_INFO_COLLECTOR_FORMAT_WINDOWS: string =
    `
$env:METRIC_OUTPUT_DIR="{0}"
$app = Start-Process "python" -ArgumentList "-m nni.tools.gpu_tool.gpu_metrics_collector" -passthru -NoNewWindow \
-redirectStandardOutput {0}\\stdout -redirectStandardError {0}\\stderr
Write $app.ID | Out-File {1} -NoNewline -encoding utf8
`;
3 changes: 2 additions & 1 deletion ts/nni_manager/training_service/common/util.ts
Original file line number Diff line number Diff line change
Expand Up @@ -236,7 +236,8 @@ export function getScriptName(fileNamePrefix: string): string {
}

/**
 * Build the one-line bash command that starts the GPU metrics collector.
 *
 * The command writes the shell's PID (`$$`) to `<scriptFolder>/pid`, then runs
 * the collector module with `METRIC_OUTPUT_DIR` set to `scriptFolder`, sending
 * its standard output and standard error to `<scriptFolder>/stdout` and
 * `<scriptFolder>/stderr`.
 *
 * @param scriptFolder - Directory used for the pid file, the metric output and
 *                       the collector's stdout/stderr logs. It is interpolated
 *                       verbatim (no shell quoting is applied).
 * @returns The bash command as a single line.
 */
export function getGpuMetricsCollectorBashScriptContent(scriptFolder: string): string {
    const collector = `METRIC_OUTPUT_DIR=${scriptFolder} python3 -m nni.tools.gpu_tool.gpu_metrics_collector`;
    // Redirect both streams so collector output ends up in log files under scriptFolder.
    const redirects = `1>${scriptFolder}/stdout 2>${scriptFolder}/stderr`;
    return `echo $$ > ${scriptFolder}/pid ; ${collector} ${redirects}`;
}

export function runGpuMetricsCollector(scriptFolder: string): void {
Expand Down

0 comments on commit 876a366

Please sign in to comment.