# Author: Kaushlendra Pratap Singh
# SPDX-FileCopyrightText: © 2021 Kaushlendra Pratap <kaushlendrapratap.9837@gmail.com>
# SPDX-FileCopyrightText: © 2023 Abdelrahman Jamal <abdelrahmanjamal5565@gmail.com>
# SPDX-License-Identifier: GPL-2.0-only
def CopyrightFalsePositiveDetection(file, clutter_flag):
    """Classify the entries of a JSON records file and print the result.

    The file is loaded into a DataFrame, an ``is_copyright`` column is
    filled from ``agent.predict`` applied to the ``content`` column, and,
    when requested, a ``decluttered_content`` column is filled from
    ``agent.declutter``.  The resulting frame is written to stdout as JSON
    in ``records`` orientation.

    Args:
        file: Path of the JSON file to read; it must provide a ``content``
            column.
        clutter_flag: Enables the declutter step when truthy.  ``None``,
            ``0``, ``""`` and the string ``"0"`` all disable it.

    Returns:
        None.  The output is printed, not returned.
    """
    # NOTE(review): `agent` is not defined anywhere in the visible part of
    # this file; it is assumed to be provided by the enclosing module --
    # confirm before merging.
    with open(file, 'r') as f:
        df = pd.read_json(f, orient='records')

    # 0.5 is forwarded as predict's second argument (presumably the decision
    # threshold -- confirm against the agent's API).
    df['is_copyright'] = agent.predict(df['content'], 0.5)

    # The flag may come straight from the command line as a string, where a
    # bare truthiness test would treat "0" as enabled.
    if clutter_flag and str(clutter_flag) != "0":
        # NOTE(review): the original call was cut off after its first
        # argument; passing the predictions as the second argument is a
        # reconstruction -- verify against agent.declutter's signature.
        df['decluttered_content'] = agent.declutter(df['content'],
                                                    df['is_copyright'])

    print(df.to_json(orient='records'))
if __name__ == "__main__":
    # Command-line entry point: parse the options, then run the detection on
    # the given file.
    parser = argparse.ArgumentParser()
    # Without `required`, a missing --file would reach open() as None and
    # fail with an unhelpful TypeError; let argparse report it instead.
    # NOTE(review): the tail of this call was cut off in the source;
    # `required=True` is a reconstruction.
    parser.add_argument("-f", "--file", help="File to be processed",
                        required=True)
    # The help text promises an integer flag, so convert it here; otherwise
    # "-c 0" arrives as the truthy string "0".
    # NOTE(review): the tail of this call was cut off in the source;
    # `type=int, default=0` is a reconstruction.
    parser.add_argument("-c", "--clutter",
                        help="Integer Flag for clutter removal", required=False,
                        type=int, default=0)
    args = parser.parse_args()
    CopyrightFalsePositiveDetection(args.file, args.clutter)