FOSSology  4.4.0
Open Source License Compliance by Open Source Software
copyrightDeactivationClutterRemovalScript.py
1 #!/usr/bin/env python3
2 '''
3  Author: Kaushlendra Pratap Singh
4  SPDX-FileCopyrightText: © 2021 Kaushlendra Pratap <kaushlendrapratap.9837@gmail.com>
5  SPDX-FileCopyrightText: © 2023 Abdelrahman Jamal <abdelrahmanjamal5565@gmail.com>
6 
7  SPDX-License-Identifier: GPL-2.0-only
8 '''
9 import pandas as pd
10 import argparse
11 from safaa.Safaa import *
12 
def CopyrightFalsePositiveDetection(file, clutter_flag):
    """Label copyright findings from a JSON file and print them as JSON.

    The file is loaded as a JSON array of records into a DataFrame, a
    ``SafaaAgent`` is asked to predict a label for every ``content`` entry
    (stored in a new ``is_copyright`` column), and the augmented records
    are printed to stdout as a JSON array.

    Args:
        file: Path of the JSON file to read. Its records must provide a
            ``content`` field.
        clutter_flag: When truthy, a ``decluttered_content`` column is
            additionally filled from ``SafaaAgent.declutter``.

    Returns:
        None. The result is written to stdout, not returned.
    """
    # Copyright statements frequently contain non-ASCII characters such as
    # "©". Decode explicitly as UTF-8 (the interchange encoding for JSON)
    # instead of relying on the platform's locale default.
    with open(file, 'r', encoding='utf-8') as f:
        df = pd.read_json(f, orient='records')

    agent = SafaaAgent()
    # NOTE(review): 0.5 is presumably the classification threshold passed to
    # the model -- confirm against the Safaa API.
    df['is_copyright'] = agent.predict(df['content'], 0.5)

    if clutter_flag:
        # declutter receives both the raw text and the predicted labels.
        df['decluttered_content'] = agent.declutter(df['content'],
                                                    df['is_copyright'])

    print(df.to_json(orient='records'))
22 
23 
if __name__ == "__main__":
    # Command-line entry point: parse the options and run the detection on
    # the given file.
    parser = argparse.ArgumentParser()
    parser.add_argument("-f", "--file", help="File to be processed",
                        required=True)
    # store_true makes this a boolean switch that takes no value and
    # defaults to False, so it is described as a flag rather than an integer.
    parser.add_argument("-c", "--clutter",
                        help="Flag to enable clutter removal",
                        action="store_true")
    args = parser.parse_args()
    CopyrightFalsePositiveDetection(args.file, args.clutter)