|
17 | 17 | from packagedcode import models |
18 | 18 | from packagedcode.models import Party |
19 | 19 | from packagedcode.models import party_org |
| 20 | +from cluecode.copyrights import detect_copyrights_from_lines |
| 21 | +from cluecode.copyrights import prepare_text_line |
20 | 22 | from typecode import contenttype |
21 | 23 |
|
22 | 24 | TRACE = False |
@@ -237,6 +239,31 @@ def concat(mapping, *keys): |
237 | 239 | return '\n'.join(values) |
238 | 240 |
|
239 | 241 |
|
| 242 | + |
def has_license_with_copyright(text):
    """
    Return True if the LegalCopyright `text` could have some license
    declarations and should be a part of the extracted_license_statement.

    Return False when `text` is empty or None: there is nothing that could
    hold a license declaration in that case. Otherwise run copyright
    detection on `text` as a single numbered line and return False only when
    the first detection carries a "copyright" entry; return True when nothing
    is detected or when the first detection has no such entry.
    """
    if not text:
        # Nothing to inspect, and no point in running the detector.
        return False

    copyrights = detect_copyrights_from_lines(
        numbered_lines=[(1, text)],
        include_copyrights=True,
        include_authors=False,
        include_holders=False,
        include_copyright_years=True,
        include_copyright_allrights=True,
    )
    detections = [detection.to_dict() for detection in copyrights]

    # Only the first detection is considered, as before.
    is_plain_copyright = bool(detections) and "copyright" in detections[0]
    return not is_plain_copyright
| 264 | + |
| 265 | + |
| 266 | + |
240 | 267 | class WindowsExecutableHandler(models.NonAssemblableDatafileHandler): |
241 | 268 | datasource_id = 'windows_executable' |
242 | 269 | default_package_type = 'winexe' |
@@ -278,66 +305,70 @@ def is_datafile(cls, location, filetypes=tuple()): |
@classmethod
def parse(cls, location, package_only=False):
    """
    Yield a single package data object built from the PE info collected
    from the file at `location`. `package_only` is passed through unchanged
    to get_package_data_from_pe_info().
    """
    yield get_package_data_from_pe_info(pe_info(location), package_only)
| 309 | + |
281 | 310 |
|
282 | | - version = get_first( |
283 | | - infos, |
284 | | - 'Full Version', |
285 | | - 'ProductVersion', |
286 | | - 'FileVersion', |
287 | | - 'Assembly Version', |
288 | | - ) |
289 | | - release_date = get_first(infos, 'BuildDate') |
290 | | - if release_date: |
291 | | - if len(release_date) >= 10: |
292 | | - release_date = release_date[:10] |
293 | | - release_date = release_date.replace('/', '-') |
294 | | - |
295 | | - name = get_first( |
296 | | - infos, |
297 | | - 'ProductName', |
298 | | - 'OriginalFilename', |
299 | | - 'InternalName', |
300 | | - ) |
301 | | - copyr = get_first(infos, 'LegalCopyright') |
302 | | - |
303 | | - LegalCopyright = copyr, |
304 | | - |
305 | | - LegalTrademarks = concat( |
306 | | - infos, |
307 | | - 'LegalTrademarks', |
308 | | - 'LegalTrademarks1', |
309 | | - 'LegalTrademarks2', |
310 | | - 'LegalTrademarks3') |
311 | | - |
312 | | - License = get_first(infos, 'License') |
313 | | - |
314 | | - extracted_license_statement = None |
315 | | - if LegalTrademarks or License: |
316 | | - extracted_license_statement = {} |
317 | | - if LegalTrademarks and LegalTrademarks != '': |
318 | | - extracted_license_statement['LegalTrademarks'] = LegalTrademarks |
319 | | - if License: |
320 | | - extracted_license_statement['License'] = License |
321 | | - |
322 | | - description = concat(infos, 'FileDescription', 'Comments') |
323 | | - |
324 | | - parties = [] |
325 | | - cname = get_first(infos, 'CompanyName', 'Company') |
326 | | - |
327 | | - if cname: |
328 | | - parties = [Party(type=party_org, role='author', name=cname)] |
329 | | - homepage_url = get_first(infos, 'URL', 'WWW') |
330 | | - |
331 | | - package_data = dict( |
332 | | - datasource_id=cls.datasource_id, |
333 | | - type=cls.default_package_type, |
334 | | - name=name, |
335 | | - version=version, |
336 | | - release_date=release_date, |
337 | | - copyright=copyr, |
338 | | - extracted_license_statement=extracted_license_statement, |
339 | | - description=description, |
340 | | - parties=parties, |
341 | | - homepage_url=homepage_url, |
342 | | - ) |
343 | | - yield models.PackageData.from_data(package_data, package_only) |
def get_package_data_from_pe_info(infos, package_only=False):
    """
    Return the result of models.PackageData.from_data() for the package
    fields collected from the `infos` mapping of PE info values.

    `package_only` is passed through unchanged to PackageData.from_data().
    The extracted_license_statement is a mapping that may hold the
    'LegalCopyright', 'LegalTrademarks' and 'License' values, or None when
    none of them applies.
    """
    version = get_first(
        infos,
        'Full Version',
        'ProductVersion',
        'FileVersion',
        'Assembly Version',
    )

    release_date = get_first(infos, 'BuildDate')
    if release_date:
        # Keep at most the first ten characters and use dashes as separators.
        release_date = release_date[:10].replace('/', '-')

    name = get_first(
        infos,
        'ProductName',
        'OriginalFilename',
        'InternalName',
    )

    copyright_text = get_first(infos, 'LegalCopyright')
    # The copyright text is also a license statement only when it is present
    # and has_license_with_copyright() says so.
    copyright_is_license = (
        copyright_text and has_license_with_copyright(copyright_text)
    )
    trademarks = concat(
        infos,
        'LegalTrademarks',
        'LegalTrademarks1',
        'LegalTrademarks2',
        'LegalTrademarks3',
    )
    license_text = get_first(infos, 'License')

    statements = {}
    if copyright_is_license:
        statements['LegalCopyright'] = copyright_text
    if trademarks:
        statements['LegalTrademarks'] = trademarks
    if license_text:
        statements['License'] = license_text
    # An empty mapping means there is no license statement at all.
    extracted_license_statement = statements or None

    description = concat(infos, 'FileDescription', 'Comments')

    company_name = get_first(infos, 'CompanyName', 'Company')
    if company_name:
        parties = [Party(type=party_org, role='author', name=company_name)]
    else:
        parties = []

    homepage_url = get_first(infos, 'URL', 'WWW')

    package_data = {
        'datasource_id': WindowsExecutableHandler.datasource_id,
        'type': WindowsExecutableHandler.default_package_type,
        'name': name,
        'version': version,
        'release_date': release_date,
        'copyright': copyright_text,
        'extracted_license_statement': extracted_license_statement,
        'description': description,
        'parties': parties,
        'homepage_url': homepage_url,
    }
    return models.PackageData.from_data(package_data, package_only)
0 commit comments