Skip to content

Commit db79e7a

Browse files
committed
Improve copyright detection more
Empty lines can break the continuity of a notice. Signed-off-by: Philippe Ombredanne <pombredanne@nexb.com>
1 parent 4939a9b commit db79e7a

37 files changed

+204
-6
lines changed

src/cluecode/copyrights.py

Lines changed: 22 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1357,11 +1357,18 @@ def build_detection_from_node(
13571357
(r'^EXHIBIT$', 'JUNK'),
13581358
(r'^Exhibit$', 'JUNK'),
13591359
(r'^Digitized', 'NN'),
1360+
(r'^OPENING', 'JUNK'),
13601361
(r'^[Ds]istributed?.?$', 'NN'),
13611362
(r'^Distributions?', 'NN'),
13621363
(r'^Multiply$', 'NN'),
13631364
(r'^Convert$', 'NN'),
13641365
(r'^Compute$', 'NN'),
1366+
1367+
(r'^\(Computer$', 'JUNK'),
1368+
(r'^Programs\)', 'JUNK'),
1369+
(r'^Regulations', 'JUNK'),
1370+
(r'^message\.', 'JUNK'),
1371+
13651372
(r'^Case$', 'NN'),
13661373
(r'^Hessian$', 'NN'),
13671374
(r'^Include', 'NN'),
@@ -1434,6 +1441,10 @@ def build_detection_from_node(
14341441
(r'^IA64$', 'NN'),
14351442
(r'^IDEA$', 'NN'),
14361443
(r'^Id$', 'NN'),
1444+
1445+
# miscapitalized last name
1446+
(r'^king$', 'NNP'),
1447+
14371448
(r'^IDENTIFICATION?\.?$', 'NN'),
14381449
(r'^IEEE$', 'NN'),
14391450
(r'^If$', 'NN'),
@@ -1444,6 +1455,8 @@ def build_detection_from_node(
14441455
(r'^INCLUDING', 'NN'),
14451456
(r'^Indemnification', 'NN'),
14461457
(r'^Indemnified', 'NN'),
1458+
(r'^Unified$', 'NN'),
1459+
(r'^Cleaned$', 'JUNK'),
14471460
(r'^Information', 'NN'),
14481461
(r'^In$', 'NN'),
14491462
(r'^Intellij$', 'NN'),
@@ -1540,7 +1553,7 @@ def build_detection_from_node(
15401553
(r'^[Rr]espective', 'NN'),
15411554
(r'^SAX$', 'NN'),
15421555
(r'^Sections?$', 'NN'),
1543-
(r'^Send$', 'NN'),
1556+
(r'^Send$', 'JUNK'),
15441557
(r'^Separa', 'NN'),
15451558
(r'^Service$', 'NN'),
15461559
(r'^Several$', 'NN'),
@@ -2160,7 +2173,8 @@ def build_detection_from_node(
21602173
# a .sh shell script is NOT an email.
21612174
(r'^.*\.sh\.?$', 'JUNK'),
21622175
# email, possibly in parens or brackets, with some trailing punctuation. Note the @ or "at "
2163-
(r'^[\<\(]?[a-zA-Z0-9]+[a-zA-Z0-9\+_\-\.\%]*(@|at)[a-zA-Z0-9][a-zA-Z0-9\+_\-\.\%]+\.[a-zA-Z]{2,3}[\>\)\.\,]*$', 'EMAIL'),
2176+
(r'^(?:[A-Za-z])*[\<\(]?[a-zA-Z0-9]+[a-zA-Z0-9\+_\-\.\%]*(@|at)[a-zA-Z0-9][a-zA-Z0-9\+_\-\.\%]+\.[a-zA-Z]{2,3}[\>\)\.\,]*$', 'EMAIL'),
2177+
21642178
# mailto URLs
21652179
(r'^mailto:.{2,}@.{2,}\.[a-z]{2,3}', 'EMAIL'),
21662180

@@ -2902,6 +2916,9 @@ def build_detection_from_node(
29022916
# Copyright 2018 (c) DistributedLock
29032917
COPYRIGHT: {<COPY> <YR-RANGE> <COPY> <NNP>} #230020
29042918
2919+
# Copyright (C) 1999-2000 VA Linux Systems
2920+
COPYRIGHT: {<COPY> <COPY> <YR-RANGE> <CAPS> <NN> <NNP>} #2280-1
2921+
29052922
COPYRIGHT2: {<COPY>+ <NN|CAPS>? <YR-RANGE>+ <PN>*} #2280
29062923
29072924
# using #2280 above: Copyright 2018 Developers of the Rand project
@@ -3043,6 +3060,9 @@ def build_detection_from_node(
30433060
#Copyright or Copr. CNRS
30443061
NAME-CAPS: {<CAPS>+} #2530
30453062
3063+
# (C) SGI 2006, Christoph Lameter
3064+
COPYRIGHT: {<COPY> <NAME-CAPS> <NAME-YEAR> } #25501
3065+
30463066
#Copyright or Copr. CNRS
30473067
COPYRIGHT: {<COPY> <NN> <COPY> <COPYRIGHT|NAME-CAPS>} #2560
30483068
COPYRIGHT: {<COPYRIGHT2> <BY> <NAME-CAPS>} #2561

src/licensedcode/data/licenses/maxmind-geolite2-eula-2019.LICENSE

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@ ignorable_authors:
1010
- the USA Department of Commerce
1111
- the USA Department of State. Specifically
1212
- the USA Treasury Department's Office of Foreign Assets Control, and the International
13-
Traffic in Arms Regulations
13+
Traffic in Arms
1414
ignorable_urls:
1515
- http://www.maxmind.com/
1616
- https://www.maxmind.com/
@@ -114,4 +114,4 @@ Should any provision of this Agreement be held void, invalid, or inoperative, su
114114

115115
COMPLIANCE WITH LAW.
116116

117-
Notwithstanding any provisions of this Agreement to the contrary, you shall in performance of this Agreement comply with all applicable laws, executive orders, regulations ordinances and rules of all governments (“Applicable Laws”), including all applicable export and re-export control laws and regulations, such as the Export Administration Regulations (“EAR”) maintained by the USA Department of Commerce, trade and economic sanctions maintained by the USA Treasury Department’s Office of Foreign Assets Control, and the International Traffic in Arms Regulations (“ITAR”) maintained by the USA Department of State. Specifically, and without limitation, you agree that you shall not, directly or indirectly, sell, export, re-export, transfer, divert, or otherwise dispose of any Services (including products derived from or based on such Services) to any destination, entity, or person prohibited by the laws or regulations of the USA, without obtaining prior authorization from the competent government authorities as required by those laws and regulations.
117+
Notwithstanding any provisions of this Agreement to the contrary, you shall in performance of this Agreement comply with all applicable laws, executive orders, regulations ordinances and rules of all governments (“Applicable Laws”), including all applicable export and re-export control laws and regulations, such as the Export Administration Regulations (“EAR”) maintained by the USA Department of Commerce, trade and economic sanctions maintained by the USA Treasury Department’s Office of Foreign Assets Control, and the International Traffic in Arms Regulations (“ITAR”) maintained by the USA Department of State. Specifically, and without limitation, you agree that you shall not, directly or indirectly, sell, export, re-export, transfer, divert, or otherwise dispose of any Services (including products derived from or based on such Services) to any destination, entity, or person prohibited by the laws or regulations of the USA, without obtaining prior authorization from the competent government authorities as required by those laws and regulations.

tests/cluecode/data/copyrights/misco4/linux2/designer.txt.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,6 @@ what:
33
- holders
44
- authors
55
copyrights:
6-
- Copyright (c) IBM Corporation, 2011-2015
6+
- Copyright (c) IBM Corporation, 2011-2015 Designer of the Power
77
holders:
8-
- IBM Corporation
8+
- IBM Corporation, Designer of the Power
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
MediaTek Inc. (c) 2008 BY OPENING
Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
what:
2+
- copyrights
3+
- holders
4+
- authors
5+
copyrights:
6+
- MediaTek Inc. (c) 2008
7+
holders:
8+
- MediaTek Inc.
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
0.0.16
2+
Modified Copyright message.
3+
0.0.17
4+
Implement Mic and Line in Capture.
5+
0.0.18
6+
Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,4 @@
1+
what:
2+
- copyrights
3+
- holders
4+
- authors
Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,4 @@
1+
Developed by:
2+
3+
LLVM Team
4+
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
what:
2+
- copyrights
3+
- holders
4+
- authors
5+
authors:
6+
- LLVM Team
Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,2 @@
1+
* Copyright (C) 1997-2002 Russell king
2+

0 commit comments

Comments
 (0)