diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml new file mode 100755 index 00000000..d8112837 --- /dev/null +++ b/.pre-commit-config.yaml @@ -0,0 +1,52 @@ +repos: +- repo: https://github.com/Lucas-C/pre-commit-hooks.git + sha: v1.0.1 + hooks: + - id: remove-crlf + files: (?!.*third_party)^.*$ | (?!.*book)^.*$ +- repo: https://github.com/PaddlePaddle/mirrors-yapf.git + sha: 0d79c0c469bab64f7229c9aca2b1186ef47f0e37 + hooks: + - id: yapf + files: (.*\.(py|bzl)|BUILD|.*\.BUILD|WORKSPACE)$ +- repo: https://github.com/pre-commit/pre-commit-hooks + sha: 5bf6c09bfa1297d3692cadd621ef95f1284e33c0 + hooks: + - id: check-added-large-files + - id: check-merge-conflict + - id: check-symlinks + - id: detect-private-key + files: (?!.*third_party)^.*$ | (?!.*book)^.*$ + - id: end-of-file-fixer +- repo: local + hooks: + - id: clang-format-with-version-check + name: clang-format + description: Format files with ClangFormat. + entry: bash ./tools/codestyle/clang_format.hook -i + language: system + files: \.(c|cc|cxx|cpp|cu|h|hpp|hxx|proto)$ +- repo: local + hooks: + - id: cpplint-cpp-source + name: cpplint + description: Check C++ code style using cpplint.py. + entry: bash ./tools/codestyle/cpplint_pre_commit.hook + language: system + files: \.(c|cc|cxx|cpp|cu|h|hpp|hxx)$ +- repo: local + hooks: + - id: pylint-doc-string + name: pylint + description: Check python docstring style using docstring_checker. + entry: bash ./tools/codestyle/pylint_pre_commit.hook + language: system + files: \.(py)$ +- repo: local + hooks: + - id: copyright_checker + name: copyright_checker + entry: python ./tools/codestyle/copyright.hook + language: system + files: \.(c|cc|cxx|cpp|cu|h|hpp|hxx|proto|py)$ + exclude: (?!.*third_party)^.*$ | (?!.*book)^.*$ diff --git a/python/paddle_fl/paddle_fl/core/master/job_generator.py b/python/paddle_fl/paddle_fl/core/master/job_generator.py index a69ffa16..1093d4b2 100644 --- a/python/paddle_fl/paddle_fl/core/master/job_generator.py +++ b/python/paddle_fl/paddle_fl/core/master/job_generator.py @@ -199,23 +199,29 @@ def generate_fl_job_for_k8s(self, local_job.set_strategy(fl_strategy) local_job.save(output) - def save_program(self, program_path, input_list, hidden_vars, loss): + def save_program(self, + main_prog, + startup_prog, + program_path, + input_list, + hidden_vars, + loss, + learning_rate=None): if not os.path.exists(program_path): os.makedirs(program_path) - main_program_str = fluid.default_main_program( - ).desc.serialize_to_string() - startup_program_str = fluid.default_startup_program( - ).desc.serialize_to_string() - params = fluid.default_main_program().global_block().all_parameters() + main_program_str = main_prog.desc.serialize_to_string() + startup_program_str = startup_prog.desc.serialize_to_string() + params = main_prog.global_block().all_parameters() para_info = [] for pa in params: para_info.append(pa.name) with open(program_path + '/input_names', 'w') as fout: for input in input_list: - fout.write("%s\n" % input.name) - with open(program_path + '/hidden_vars', 'w') as fout: - for var in hidden_vars: - fout.write("%s:%s\n" % (var[0], var[1].name)) + fout.write("%s\n" % input) + if hidden_vars != None: + with open(program_path + '/hidden_vars', 'w') as fout: + for var in hidden_vars: + fout.write("%s:%s\n" % (var[0], var[1].name)) with open(program_path + '/para_info', 'w') as fout: for item in para_info: fout.write("%s\n" % item) @@ -225,6 +231,9 @@ def save_program(self, program_path, input_list, hidden_vars, loss): fout.write(main_program_str) with open(program_path + '/loss_name', 'w') as fout: fout.write(loss.name) + if type(learning_rate) == fluid.Variable: + with open(program_path + '/lr_name', 'w') as fout: + fout.write(learning_rate.name) def generate_fl_job_from_program(self, strategy, endpoints, worker_num, program_input, output): @@ -252,6 +261,12 @@ def generate_fl_job_from_program(self, strategy, endpoints, worker_num, with open(program_input + '/loss_name', 'r') as fin: loss_name = fin.read() + if os.path.exists(program_input + '/lr_name'): + with open(program_input + '/lr_name', 'r') as fin: + lr_name = fin.read() + else: + lr_name = None + for item in para_list: para = new_main.global_block().var(item) para.regularizer = None @@ -262,9 +277,20 @@ def generate_fl_job_from_program(self, strategy, endpoints, worker_num, for var in new_main.list_vars(): if var.name == loss_name: loss = var + if lr_name != None: + if var.name == lr_name: + lr = var + with fluid.program_guard(new_main, new_startup): - optimizer = fluid.optimizer.SGD(learning_rate=0.1, - parameter_list=para_list) + if lr_name != None: + optimizer = fluid.optimizer.MomentumOptimizer( + learning_rate=lr, momentum=0.9, parameter_list=para_list) + else: + optimizer = fluid.optimizer.MomentumOptimizer( + learning_rate=0.00001, + momentum=0.9, + parameter_list=para_list) + exe.run(new_startup) strategy.minimize(optimizer, loss) diff --git a/python/paddle_fl/paddle_fl/core/strategy/fl_distribute_transpiler.py b/python/paddle_fl/paddle_fl/core/strategy/fl_distribute_transpiler.py index 0d204f8f..6715eb27 100644 --- a/python/paddle_fl/paddle_fl/core/strategy/fl_distribute_transpiler.py +++ b/python/paddle_fl/paddle_fl/core/strategy/fl_distribute_transpiler.py @@ -695,7 +695,8 @@ def _init_splited_vars(self): opti_to_param = dict() param_to_opti = dict() for op in self.optimize_ops: - if (op.type == "sgd") or (op.type == "adam"): + if (op.type == "sgd") or (op.type == "adam") or ( + op.type == "momentum"): origin_name = op.output("ParamOut") var = self.origin_program.global_block().var(origin_name[0]) new_var_name = "%s.opti.trainer_%d" % (origin_name[0], diff --git a/python/paddle_fl/paddle_fl/examples/generate_job_from_program/fl_trainer.py b/python/paddle_fl/paddle_fl/examples/generate_job_from_program/fl_trainer.py index 19ca360e..15b8fa5d 100644 --- a/python/paddle_fl/paddle_fl/examples/generate_job_from_program/fl_trainer.py +++ b/python/paddle_fl/paddle_fl/examples/generate_job_from_program/fl_trainer.py @@ -79,6 +79,3 @@ def train_test(train_test_program, train_test_feed, train_test_reader): train_test_feed=feeder) print("Test with epoch %d, accuracy: %s" % (epoch_id, acc_val)) - - save_dir = (output_folder + "/epoch_%d") % epoch_id - trainer.save_inference_program(output_folder) diff --git a/python/paddle_fl/paddle_fl/examples/generate_job_from_program/program_saver.py b/python/paddle_fl/paddle_fl/examples/generate_job_from_program/program_saver.py index e6f75288..880d7a93 100644 --- a/python/paddle_fl/paddle_fl/examples/generate_job_from_program/program_saver.py +++ b/python/paddle_fl/paddle_fl/examples/generate_job_from_program/program_saver.py @@ -25,12 +25,13 @@ accuracy = fluid.layers.accuracy(input=predict, label=label) avg_cost = fluid.layers.mean(sum_cost, name="loss") startup_program = fluid.default_startup_program() +main_program = fluid.default_main_program() place = fluid.CPUPlace() exe = fluid.Executor(place) exe.run(startup_program) job_generator = JobGenerator() program_path = './load_file' -job_generator.save_program(program_path, [input, label], - [['predict', predict], ['accuracy', accuracy]], - avg_cost) +job_generator.save_program( + main_program, startup_program, program_path, [input, label], + [['predict', predict], ['accuracy', accuracy]], avg_cost)