From 8ce1856ea194d9bb7682978437963d6d0b90d9d1 Mon Sep 17 00:00:00 2001 From: Allen Xu Date: Fri, 7 Jul 2023 11:54:42 +0800 Subject: [PATCH] resolve comments Signed-off-by: Allen Xu --- nds/README.md | 2 +- nds/nds_transcode.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/nds/README.md b/nds/README.md index 424f102..f216ae0 100644 --- a/nds/README.md +++ b/nds/README.md @@ -141,7 +141,7 @@ The utility requires a pre-defined [template file](./convert_submit_gpu.template necessary Spark configurations. Either user can submit the `nds_transcode.py` directly to spark with arbitrary Spark parameters. -CSV, Parquet and ORC are supported for input data format at present. +CSV is the default input format for data conversion; it can be overridden by `--input_format`. Parquet, Orc, Avro, JSON and Iceberg are supported for output data format at present with CPU. For GPU conversion, only Parquet and Orc are supported. diff --git a/nds/nds_transcode.py b/nds/nds_transcode.py index c5622fa..eef117d 100644 --- a/nds/nds_transcode.py +++ b/nds/nds_transcode.py @@ -1,7 +1,7 @@ #!/usr/bin/env python3 # -*- coding: utf-8 -*- # -# SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved. +# SPDX-FileCopyrightText: Copyright (c) 2022-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved. # SPDX-License-Identifier: Apache-2.0 # # Licensed under the Apache License, Version 2.0 (the "License");