diff --git a/Pipfile b/Pipfile index 9a0f50e..ad561a6 100644 --- a/Pipfile +++ b/Pipfile @@ -17,6 +17,15 @@ trino = "*" pandas = "*" pyarrow = "*" python-dotenv = "*" +pdf2image = "*" +mmdet = "*" +mmcv-full = "*" +torch = "*" +torchvision = "*" +tabula-py = "*" +gdown = "*" +pdfminer.six = "*" +fuzzywuzzy = "*" python-Levenshtein = "*" [requires] diff --git a/Pipfile.lock b/Pipfile.lock index ed3156c..3121b35 100644 --- a/Pipfile.lock +++ b/Pipfile.lock @@ -1,7 +1,7 @@ { "_meta": { "hash": { - "sha256": "68b49a0efd714a801b8429f1778f95757045bdfaacad8ce51ffc99f19b6aad31" + "sha256": "91bc1a42ee60829f9ad8a1b1de4ebe1981c448fa6aededdb87d4b285d3a0d55b" }, "pipfile-spec": 6, "requires": { @@ -16,36 +16,43 @@ ] }, "default": { + "addict": { + "hashes": [ + "sha256:249bb56bbfd3cdc2a004ea0ff4c2b6ddc84d53bc2194761636eb314d5cfa5dfc", + "sha256:b3b2210e0e067a281f5646c8c5db92e99b7231ea8b0eb5f74dbdf9e259d4e494" + ], + "version": "==2.4.0" + }, "awscli": { "hashes": [ - "sha256:608366218de43c6326b9b1d044d3fc44dc02da70ce251fe941d4ecc7392b07d9", - "sha256:b2d9ee3e86c1288a4a0388932864cee6498c125ee0ac575936bcb3e344b9f7d3" + "sha256:299967d021a3799d7f48a0f56e66ed5d064cdb97cf87a7a59ba850be9b57d4ff", + "sha256:6925b1e92765b89dea044551786917364a4b7f59bbec46ed1b27d1db28d79238" ], "index": "pypi", - "version": "==1.20.54" + "version": "==1.20.58" }, "boto3": { "hashes": [ - "sha256:2d81dc484020059fc738165984304107d4db1c6774b6310d08c892a1751f6980", - "sha256:f22a77098cd70ddf848df6981ec57b92178e9d8eb74637edbdf4173bfa9279fa" + "sha256:7309552da6ef9e610f8a9712c8abe29a8d3d45b514188cc3efad47bd1774bf77", + "sha256:f680dee9c670d42ab4a6da5539ca3691d1ccbbcbf041e7021025029776864156" ], "index": "pypi", - "version": "==1.18.54" + "version": "==1.18.58" }, "botocore": { "hashes": [ - "sha256:46127b3a385d0ec73d1994b8958b23b79e0613e12c486371a100df992b72a1b9", - "sha256:56b74a5186bec835baf580b2d062ea1738d3ff5a573653d41b3ad1598a5b77c4" + 
"sha256:87e881569c32b218a1b82ecb607a4dddb4dca3b80a5d1016571b99b51cef3158", + "sha256:9d84a97015c0565a81c0b6d55e60af5ab1a2da28039ad93976388014a14186da" ], "markers": "python_version >= '3.6'", - "version": "==1.21.54" + "version": "==1.21.58" }, "certifi": { "hashes": [ - "sha256:2bbf76fd432960138b3ef6dda3dde0544f27cbf8546c458e60baf371917ba9ee", - "sha256:50b1e4f8446b06f41be7dd6338db18e0990601dce795c2b1686458aa7e8fa7d8" + "sha256:78884e7c1d4b00ce3cea67b44566851c4343c120abd683433ce934a68ea58872", + "sha256:d62a0163eb4c2344ac042ab2bdf75399a71a2d8c7d47eac2e2ee91b9d6339569" ], - "version": "==2021.5.30" + "version": "==2021.10.8" }, "charset-normalizer": { "hashes": [ @@ -57,11 +64,11 @@ }, "click": { "hashes": [ - "sha256:8c04c11192119b1ef78ea049e0a6f0463e4c48ef00a30160c704337586f3ad7a", - "sha256:fba402a4a47334742d782209a7c79bc448911afe1149d07bdabdf480b3e2f4b6" + "sha256:353f466495adaeb40b6b5f592f9f91cb22372351c84caeb068132442a4518ef3", + "sha256:410e932b050f5eed773c4cda94de75971c89cdb3155a72a0831139a79e5ecb5b" ], "markers": "python_version >= '3.6'", - "version": "==8.0.1" + "version": "==8.0.3" }, "colorama": { "hashes": [ @@ -71,6 +78,65 @@ "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4'", "version": "==0.4.3" }, + "cycler": { + "hashes": [ + "sha256:1d8a5ae1ff6c5cf9b93e8811e581232ad8920aeec647c37316ceac982b08cb2d", + "sha256:cd7b2d1018258d7247a71425e9f26463dfb444d411c39569972f4ce586b0c9d8" + ], + "version": "==0.10.0" + }, + "cython": { + "hashes": [ + "sha256:09ac3087ac7a3d489ebcb3fb8402e00c13d1a3a1c6bc73fd3b0d756a3e341e79", + "sha256:0a142c6b862e6ed6b02209d543062c038c110585b5e32d1ad7c9717af4f07e41", + "sha256:0d414458cb22f8a90d64260da6dace5d5fcebde43f31be52ca51f818c46db8cb", + "sha256:10cb3def9774fa99e4583617a5616874aed3255dc241fd1f4a3c2978c78e1c53", + "sha256:112efa54a58293a4fb0acf0dd8e5b3736e95b595eee24dd88615648e445abe41", + "sha256:166f9f29cd0058ce1a14a7b3a2458b849ed34b1ec5fd4108af3fdd2c24afcbb0", + 
"sha256:2d9e61ed1056a3b6a4b9156b62297ad18b357a7948e57a2f49b061217696567e", + "sha256:2f41ef7edd76dd23315925e003f0c58c8585f3ab24be6885c4b3f60e77c82746", + "sha256:37bcfa5df2a3009f49624695d917c3804fccbdfcdc5eda6378754a879711a4d5", + "sha256:416046a98255eff97ec02077d20ebeaae52682dfca1c35aadf31260442b92514", + "sha256:4cf4452f0e4d50e11701bca38f3857fe6fa16593e7fd6a4d5f7be66f611b7da2", + "sha256:55b0ee28c2c8118bfb3ad9b25cf7a6cbd724e442ea96956e32ccd908d5e3e043", + "sha256:5dd56d0be50073f0e54825a8bc3393852de0eed126339ecbca0ae149dba55cfc", + "sha256:5fa12ebafc2f688ea6d26ab6d1d2e634a9872509ba7135b902bb0d8b368fb04b", + "sha256:5fb977945a2111f6b64501fdf7ed0ec162cc502b84457fd648d6a558ea8de0d6", + "sha256:60c958bcab0ff315b4036a949bed1c65334e1f6a69e17e9966d742febb59043a", + "sha256:661dbdea519d9cfb288867252b75fef73ffa8e8bb674cec27acf70646afb369b", + "sha256:6a2cf2ccccc25413864928dfd730c29db6f63eaf98206c1e600003a445ca7f58", + "sha256:6ade74eece909fd3a437d9a5084829180751d7ade118e281e9824dd75eafaff2", + "sha256:73ac33a4379056a02031baa4def255717fadb9181b5ac2b244792d53eae1c925", + "sha256:76cbca0188d278e93d12ebdaf5990678e6e436485fdfad49dbe9b07717d41a3c", + "sha256:774cb8fd931ee1ba52c472bc1c19077cd6895c1b24014ae07bb27df59aed5ebe", + "sha256:821c2d416ad7d006b069657ee1034c0e0cb45bdbe9ab6ab631e8c495dfcfa4ac", + "sha256:84826ec1c11cda56261a252ddecac0c7d6b02e47e81b94f40b27b4c23c29c17c", + "sha256:854fe2193d3ad4c8b61932ff54d6dbe10c5fa8749eb8958d72cc0ab28243f833", + "sha256:88dc3c250dec280b0489a83950b15809762e27232f4799b1b8d0bad503f5ab84", + "sha256:8cb87777e82d1996aef6c146560a19270684271c9c669ba62ac6803b3cd2ff82", + "sha256:91339ee4b465924a3ea4b2a9cec7f7227bc4cadf673ce859d24c2b9ef60b1214", + "sha256:9164aeef1af6f837e4fc20402a31d256188ba4d535e262c6cb78caf57ad744f8", + "sha256:a102cfa795c6b3b81a29bdb9dbec545367cd7f353c03e6f30a056fdfefd92854", + "sha256:ad43e684ade673565f6f9d6638015112f6c7f11aa2a632167b79014f613f0f5f", + "sha256:afb521523cb46ddaa8d269b421f88ea2731fee05e65b952b96d4db760f5a2a1c", 
+ "sha256:b28f92e617f540d3f21f8fd479a9c6491be920ffff672a4c61b7fc4d7f749f39", + "sha256:bc05de569f811be1fcfde6756c9048ae518f0c4b6d9f8f024752c5365d934cac", + "sha256:cdf04d07c3600860e8c2ebaad4e8f52ac3feb212453c1764a49ac08c827e8443", + "sha256:d8d1a087f35e39384303f5e6b75d465d6f29d746d7138eae9d3b6e8e6f769eae", + "sha256:eb2843f8cc01c645725e6fc690a84e99cdb266ce8ebe427cf3a680ff09f876aa", + "sha256:f2e9381497b12e8f622af620bde0d1d094035d79b899abb2ddd3a7891f535083", + "sha256:f96411f0120b5cae483923aaacd2872af8709be4b46522daedc32f051d778385" + ], + "markers": "python_version >= '2.6' and python_version not in '3.0, 3.1, 3.2, 3.3'", + "version": "==0.29.24" + }, + "distro": { + "hashes": [ + "sha256:83f5e5a09f9c5f68f60173de572930effbcc0287bb84fdc4426cb4168c088424", + "sha256:c8713330ab31a034623a9515663ed87696700b55f04556b97c39cd261aa70dc7" + ], + "version": "==1.6.0" + }, "docutils": { "hashes": [ "sha256:6c4f696463b79f1fb8ba0c594b63840ebd41f059e92b31957c46b74a4599b6d0", @@ -80,6 +146,29 @@ "markers": "python_version >= '2.6' and python_version not in '3.0, 3.1, 3.2, 3.3'", "version": "==0.15.2" }, + "filelock": { + "hashes": [ + "sha256:8c7eab13dc442dc249e95158bcc12dec724465919bdc9831fdbf0660f03d1785", + "sha256:bbc6a0382fe8ec4744ecdf6683a2e07f65eb10ff1aff53fc02a202565446cde0" + ], + "markers": "python_version >= '3.6'", + "version": "==3.3.0" + }, + "fuzzywuzzy": { + "hashes": [ + "sha256:45016e92264780e58972dca1b3d939ac864b78437422beecebb3095f8efd00e8", + "sha256:928244b28db720d1e0ee7587acf660ea49d7e4c632569cad4f1cd7e68a5f0993" + ], + "index": "pypi", + "version": "==0.18.0" + }, + "gdown": { + "hashes": [ + "sha256:5d261cde60ac156fb1e9a6450cdb5413d947bfdbcf52f91db2a99bb455fb690c" + ], + "index": "pypi", + "version": "==4.0.2" + }, "idna": { "hashes": [ "sha256:14475042e284991034cb48e06f6851428fb14c4dc953acd9be9a5e95c7b6dd7a", @@ -96,6 +185,98 @@ "markers": "python_version >= '2.6' and python_version not in '3.0, 3.1, 3.2, 3.3'", "version": "==0.10.0" }, + "kiwisolver": { 
+ "hashes": [ + "sha256:0007840186bacfaa0aba4466d5890334ea5938e0bb7e28078a0eb0e63b5b59d5", + "sha256:19554bd8d54cf41139f376753af1a644b63c9ca93f8f72009d50a2080f870f77", + "sha256:1d45d1c74f88b9f41062716c727f78f2a59a5476ecbe74956fafb423c5c87a76", + "sha256:1d819553730d3c2724582124aee8a03c846ec4362ded1034c16fb3ef309264e6", + "sha256:2210f28778c7d2ee13f3c2a20a3a22db889e75f4ec13a21072eabb5693801e84", + "sha256:22521219ca739654a296eea6d4367703558fba16f98688bd8ce65abff36eaa84", + "sha256:25405f88a37c5f5bcba01c6e350086d65e7465fd1caaf986333d2a045045a223", + "sha256:2b65bd35f3e06a47b5c30ea99e0c2b88f72c6476eedaf8cfbc8e66adb5479dcf", + "sha256:2ddb500a2808c100e72c075cbb00bf32e62763c82b6a882d403f01a119e3f402", + "sha256:2f8f6c8f4f1cff93ca5058d6ec5f0efda922ecb3f4c5fb76181f327decff98b8", + "sha256:30fa008c172355c7768159983a7270cb23838c4d7db73d6c0f6b60dde0d432c6", + "sha256:3dbb3cea20b4af4f49f84cffaf45dd5f88e8594d18568e0225e6ad9dec0e7967", + "sha256:4116ba9a58109ed5e4cb315bdcbff9838f3159d099ba5259c7c7fb77f8537492", + "sha256:44e6adf67577dbdfa2d9f06db9fbc5639afefdb5bf2b4dfec25c3a7fbc619536", + "sha256:5326ddfacbe51abf9469fe668944bc2e399181a2158cb5d45e1d40856b2a0589", + "sha256:70adc3658138bc77a36ce769f5f183169bc0a2906a4f61f09673f7181255ac9b", + "sha256:72be6ebb4e92520b9726d7146bc9c9b277513a57a38efcf66db0620aec0097e0", + "sha256:7843b1624d6ccca403a610d1277f7c28ad184c5aa88a1750c1a999754e65b439", + "sha256:7ba5a1041480c6e0a8b11a9544d53562abc2d19220bfa14133e0cdd9967e97af", + "sha256:80efd202108c3a4150e042b269f7c78643420cc232a0a771743bb96b742f838f", + "sha256:82f49c5a79d3839bc8f38cb5f4bfc87e15f04cbafa5fbd12fb32c941cb529cfb", + "sha256:83d2c9db5dfc537d0171e32de160461230eb14663299b7e6d18ca6dca21e4977", + "sha256:8d93a1095f83e908fc253f2fb569c2711414c0bfd451cab580466465b235b470", + "sha256:8dc3d842fa41a33fe83d9f5c66c0cc1f28756530cd89944b63b072281e852031", + "sha256:9661a04ca3c950a8ac8c47f53cbc0b530bce1b52f516a1e87b7736fec24bfff0", + 
"sha256:a498bcd005e8a3fedd0022bb30ee0ad92728154a8798b703f394484452550507", + "sha256:a7a4cf5bbdc861987a7745aed7a536c6405256853c94abc9f3287c3fa401b174", + "sha256:b5074fb09429f2b7bc82b6fb4be8645dcbac14e592128beeff5461dcde0af09f", + "sha256:b6a5431940f28b6de123de42f0eb47b84a073ee3c3345dc109ad550a3307dd28", + "sha256:ba677bcaff9429fd1bf01648ad0901cea56c0d068df383d5f5856d88221fe75b", + "sha256:bcadb05c3d4794eb9eee1dddf1c24215c92fb7b55a80beae7a60530a91060560", + "sha256:bf7eb45d14fc036514c09554bf983f2a72323254912ed0c3c8e697b62c4c158f", + "sha256:c358721aebd40c243894298f685a19eb0491a5c3e0b923b9f887ef1193ddf829", + "sha256:c4550a359c5157aaf8507e6820d98682872b9100ce7607f8aa070b4b8af6c298", + "sha256:c6572c2dab23c86a14e82c245473d45b4c515314f1f859e92608dcafbd2f19b8", + "sha256:cba430db673c29376135e695c6e2501c44c256a81495da849e85d1793ee975ad", + "sha256:dedc71c8eb9c5096037766390172c34fb86ef048b8e8958b4e484b9e505d66bc", + "sha256:e6f5eb2f53fac7d408a45fbcdeda7224b1cfff64919d0f95473420a931347ae9", + "sha256:ec2eba188c1906b05b9b49ae55aae4efd8150c61ba450e6721f64620c50b59eb", + "sha256:ee040a7de8d295dbd261ef2d6d3192f13e2b08ec4a954de34a6fb8ff6422e24c", + "sha256:eedd3b59190885d1ebdf6c5e0ca56828beb1949b4dfe6e5d0256a461429ac386", + "sha256:f441422bb313ab25de7b3dbfd388e790eceb76ce01a18199ec4944b369017009", + "sha256:f8eb7b6716f5b50e9c06207a14172cf2de201e41912ebe732846c02c830455b9", + "sha256:fc4453705b81d03568d5b808ad8f09c77c47534f6ac2e72e733f9ca4714aa75c" + ], + "markers": "python_version >= '3.7'", + "version": "==1.3.2" + }, + "matplotlib": { + "hashes": [ + "sha256:01c9de93a2ca0d128c9064f23709362e7fefb34910c7c9e0b8ab0de8258d5eda", + "sha256:41b6e307458988891fcdea2d8ecf84a8c92d53f84190aa32da65f9505546e684", + "sha256:48e1e0859b54d5f2e29bb78ca179fd59b971c6ceb29977fb52735bfd280eb0f5", + "sha256:54a026055d5f8614f184e588f6e29064019a0aa8448450214c0b60926d62d919", + "sha256:556965514b259204637c360d213de28d43a1f4aed1eca15596ce83f768c5a56f", + 
"sha256:5c988bb43414c7c2b0a31bd5187b4d27fd625c080371b463a6d422047df78913", + "sha256:6a724e3a48a54b8b6e7c4ae38cd3d07084508fa47c410c8757e9db9791421838", + "sha256:6be8df61b1626e1a142c57e065405e869e9429b4a6dab4a324757d0dc4d42235", + "sha256:844a7b0233e4ff7fba57e90b8799edaa40b9e31e300b8d5efc350937fa8b1bea", + "sha256:85f0c9cf724715e75243a7b3087cf4a3de056b55e05d4d76cc58d610d62894f3", + "sha256:a78a3b51f29448c7f4d4575e561f6b0dbb8d01c13c2046ab6c5220eb25c06506", + "sha256:b884715a59fec9ad3b6048ecf3860f3b2ce965e676ef52593d6fa29abcf7d330", + "sha256:b8b53f336a4688cfce615887505d7e41fd79b3594bf21dd300531a4f5b4f746a", + "sha256:c70b6311dda3e27672f1bf48851a0de816d1ca6aaf3d49365fbdd8e959b33d2b", + "sha256:ebfb01a65c3f5d53a8c2a8133fec2b5221281c053d944ae81ff5822a68266617", + "sha256:eeb1859efe7754b1460e1d4991bbd4a60a56f366bc422ef3a9c5ae05f0bc70b5", + "sha256:f15edcb0629a0801738925fe27070480f446fcaa15de65946ff946ad99a59a40", + "sha256:f1c5efc278d996af8a251b2ce0b07bbeccb821f25c8c9846bdcb00ffc7f158aa", + "sha256:f72657f1596199dc1e4e7a10f52a4784ead8a711f4e5b59bea95bdb97cf0e4fd", + "sha256:fc4f526dfdb31c9bd6b8ca06bf9fab663ca12f3ec9cdf4496fb44bc680140318", + "sha256:fcd6f1954943c0c192bfbebbac263f839d7055409f1173f80d8b11a224d236da" + ], + "markers": "python_version >= '3.7'", + "version": "==3.4.3" + }, + "mmcv-full": { + "hashes": [ + "sha256:d8b7c7d6a186ddc97a8d606df14671397f5bc6d6e893c8f774d39c0dbd24bc69" + ], + "index": "pypi", + "version": "==1.3.14" + }, + "mmdet": { + "hashes": [ + "sha256:4277baf39269e2d4d074a436dba34acf12d5eedb3883d5e4f0998bbea668bc83", + "sha256:a79196e57735cee88c53939f1bbe3cf22ec5f4bd4646aafc250b36241c4aa62e" + ], + "index": "pypi", + "version": "==2.17.0" + }, "numpy": { "hashes": [ "sha256:09858463db6dd9f78b2a1a05c93f3b33d4f65975771e90d2cf7aadb7c2f66edf", @@ -132,6 +313,44 @@ "markers": "python_version < '3.11' and python_version >= '3.7'", "version": "==1.21.2" }, + "opencv-python": { + "hashes": [ + 
"sha256:05c5139d620e8d02f7ce0921796d55736fa19fa15e2ec00a388db2eb1ae1e9a1", + "sha256:085232718f28bddd265da480874c37db5c7354cb08f23f4a68a8639b16276a89", + "sha256:18a4a14015eee30d9cd514db8cdefbf594b1d5c234762d27abe512d62a333bc3", + "sha256:205a73adb29c37e42475645519e612e843a985475da993d10b4d5daa6afec36a", + "sha256:3c001d3feec7f3140f1fb78dfc52ca28122db8240826882d175a208a89d2731b", + "sha256:437f30e300725e1d1b3744dbfbc66a523a4744792b58f3dbe1e9140c8f4dfba5", + "sha256:5366fcd6eae4243add3c8c92142045850f1db8e464bcf0b75313e1596b2e3671", + "sha256:54c64e86a087841869901fd34462bb6bec01cd4652800fdf5d92fe7b0596c82f", + "sha256:6763729fcfee2a08e069aa1982c9a8c1abf55b9cdf2fb9640eda1d85bdece19a", + "sha256:68813b720b88e4951e84399b9a8a7b532d45a07a96ea8f539636242f862e32e0", + "sha256:7f41b97d84ac66bdf13cb4d9f4dad3e159525ba1e3f421e670c787ce536eb70a", + "sha256:831b92fe63ce18dd628f71104da7e60596658b75e2fa16b83aefa3eb10c115e2", + "sha256:881f3d85269500e0c7d72b140a6ebb5c14a089f8140fb9da7ce01f12a245858e", + "sha256:8852be06c0749fef0d9c58f532bbcb0570968c59e41cf56b90f5c92593c6e108", + "sha256:8b5bc61be7fc8565140b746288b370a4bfdb4edb9d680b66bb914e7690485db1", + "sha256:8d3282138f3a8646941089aae142684910ebe40776266448eab5f4bb609fc63f", + "sha256:9a78558b5ae848386edbb843c761e5fed5a8480be9af16274a5a78838529edeb", + "sha256:b42bbba9f5421865377c7960bd4f3dd881003b322a6bf46ed2302b89224d102b", + "sha256:c360cb76ad1ddbd5d2d3e730b42f2ff6e4be08ea6f4a6eefacca175d27467e8f", + "sha256:cdc3363c2911d7cfc6c9f55308c51c2841a7aecbf0bf5e791499d220ce89d880", + "sha256:e1f54736272830a1e895cedf7a4ee67737e31e966d380c82a81ef22515d043a3", + "sha256:e42c644a70d5c54f53a4b114dbd88b4eb83f42a9ca998f07bd5682f3f404efcc", + "sha256:f1bda4d144f5204e077ca4571453ebb2015e5748d5e0043386c92c2bbf7f52eb", + "sha256:f3ac2355217114a683f3f72a9c40a5890914a59c4a2df62e4083c66ff65c9cf9" + ], + "markers": "python_version >= '3.6'", + "version": "==4.5.3.56" + }, + "packaging": { + "hashes": [ + 
"sha256:7dc96269f53a4ccec5c0670940a4281106dd0bb343f47b7471f779df49c2fbe7", + "sha256:c86254f9220d55e31cc94d69bade760f0847da8000def4dfe1c6b872fd14ff14" + ], + "markers": "python_version >= '3.6'", + "version": "==21.0" + }, "pandas": { "hashes": [ "sha256:272c8cb14aa9793eada6b1ebe81994616e647b5892a370c7135efb2924b701df", @@ -159,6 +378,81 @@ "index": "pypi", "version": "==1.3.3" }, + "pdf2image": { + "hashes": [ + "sha256:84f79f2b8fad943e36323ea4e937fcb05f26ded0caa0a01181df66049e42fb65", + "sha256:d58ed94d978a70c73c2bb7fdf8acbaf2a7089c29ff8141be5f45433c0c4293bb" + ], + "index": "pypi", + "version": "==1.16.0" + }, + "pdfminer": { + "hashes": [ + "sha256:9e700bc731300ed5c8936343c1dd4529638184198e54e91dd2b59b64a755dc01" + ], + "index": "pypi", + "six": "*", + "version": "==20191125" + }, + "pillow": { + "hashes": [ + "sha256:0412516dcc9de9b0a1e0ae25a280015809de8270f134cc2c1e32c4eeb397cf30", + "sha256:04835e68ef12904bc3e1fd002b33eea0779320d4346082bd5b24bec12ad9c3e9", + "sha256:06d1adaa284696785375fa80a6a8eb309be722cf4ef8949518beb34487a3df71", + "sha256:085a90a99404b859a4b6c3daa42afde17cb3ad3115e44a75f0d7b4a32f06a6c9", + "sha256:0b9911ec70731711c3b6ebcde26caea620cbdd9dcb73c67b0730c8817f24711b", + "sha256:10e00f7336780ca7d3653cf3ac26f068fa11b5a96894ea29a64d3dc4b810d630", + "sha256:11c27e74bab423eb3c9232d97553111cc0be81b74b47165f07ebfdd29d825875", + "sha256:11eb7f98165d56042545c9e6db3ce394ed8b45089a67124298f0473b29cb60b2", + "sha256:13654b521fb98abdecec105ea3fb5ba863d1548c9b58831dd5105bb3873569f1", + "sha256:15ccb81a6ffc57ea0137f9f3ac2737ffa1d11f786244d719639df17476d399a7", + "sha256:18a07a683805d32826c09acfce44a90bf474e6a66ce482b1c7fcd3757d588df3", + "sha256:19ec4cfe4b961edc249b0e04b5618666c23a83bc35842dea2bfd5dfa0157f81b", + "sha256:1c3ff00110835bdda2b1e2b07f4a2548a39744bb7de5946dc8e95517c4fb2ca6", + "sha256:27a330bf7014ee034046db43ccbb05c766aa9e70b8d6c5260bfc38d73103b0ba", + "sha256:2b11c9d310a3522b0fd3c35667914271f570576a0e387701f370eb39d45f08a4", + 
"sha256:2c661542c6f71dfd9dc82d9d29a8386287e82813b0375b3a02983feac69ef864", + "sha256:2cde7a4d3687f21cffdf5bb171172070bb95e02af448c4c8b2f223d783214056", + "sha256:2d5e9dc0bf1b5d9048a94c48d0813b6c96fccfa4ccf276d9c36308840f40c228", + "sha256:2f23b2d3079522fdf3c09de6517f625f7a964f916c956527bed805ac043799b8", + "sha256:35d27687f027ad25a8d0ef45dd5208ef044c588003cdcedf05afb00dbc5c2deb", + "sha256:35d409030bf3bd05fa66fb5fdedc39c521b397f61ad04309c90444e893d05f7d", + "sha256:4326ea1e2722f3dc00ed77c36d3b5354b8fb7399fb59230249ea6d59cbed90da", + "sha256:4abc247b31a98f29e5224f2d31ef15f86a71f79c7f4d2ac345a5d551d6393073", + "sha256:4d89a2e9219a526401015153c0e9dd48319ea6ab9fe3b066a20aa9aee23d9fd3", + "sha256:4e59e99fd680e2b8b11bbd463f3c9450ab799305d5f2bafb74fefba6ac058616", + "sha256:548794f99ff52a73a156771a0402f5e1c35285bd981046a502d7e4793e8facaa", + "sha256:56fd98c8294f57636084f4b076b75f86c57b2a63a8410c0cd172bc93695ee979", + "sha256:59697568a0455764a094585b2551fd76bfd6b959c9f92d4bdec9d0e14616303a", + "sha256:6bff50ba9891be0a004ef48828e012babaaf7da204d81ab9be37480b9020a82b", + "sha256:6cb3dd7f23b044b0737317f892d399f9e2f0b3a02b22b2c692851fb8120d82c6", + "sha256:7dbfbc0020aa1d9bc1b0b8bcf255a7d73f4ad0336f8fd2533fcc54a4ccfb9441", + "sha256:838eb85de6d9307c19c655c726f8d13b8b646f144ca6b3771fa62b711ebf7624", + "sha256:8b68f565a4175e12e68ca900af8910e8fe48aaa48fd3ca853494f384e11c8bcd", + "sha256:8f284dc1695caf71a74f24993b7c7473d77bc760be45f776a2c2f4e04c170550", + "sha256:963ebdc5365d748185fdb06daf2ac758116deecb2277ec5ae98139f93844bc09", + "sha256:a048dad5ed6ad1fad338c02c609b862dfaa921fcd065d747194a6805f91f2196", + "sha256:a1bd983c565f92779be456ece2479840ec39d386007cd4ae83382646293d681b", + "sha256:a66566f8a22561fc1a88dc87606c69b84fa9ce724f99522cf922c801ec68f5c1", + "sha256:bcb04ff12e79b28be6c9988f275e7ab69f01cc2ba319fb3114f87817bb7c74b6", + "sha256:bd24054aaf21e70a51e2a2a5ed1183560d3a69e6f9594a4bfe360a46f94eba83", + "sha256:be25cb93442c6d2f8702c599b51184bd3ccd83adebd08886b682173e09ef0c3f", 
+ "sha256:c691b26283c3a31594683217d746f1dad59a7ae1d4cfc24626d7a064a11197d4", + "sha256:cc9d0dec711c914ed500f1d0d3822868760954dce98dfb0b7382a854aee55d19", + "sha256:ce2e5e04bb86da6187f96d7bab3f93a7877830981b37f0287dd6479e27a10341", + "sha256:ce651ca46d0202c302a535d3047c55a0131a720cf554a578fc1b8a2aff0e7d96", + "sha256:d0c8ebbfd439c37624db98f3877d9ed12c137cadd99dde2d2eae0dab0bbfc355", + "sha256:d675a876b295afa114ca8bf42d7f86b5fb1298e1b6bb9a24405a3f6c8338811c", + "sha256:dde3f3ed8d00c72631bc19cbfff8ad3b6215062a5eed402381ad365f82f0c18c", + "sha256:e5a31c07cea5edbaeb4bdba6f2b87db7d3dc0f446f379d907e51cc70ea375629", + "sha256:f514c2717012859ccb349c97862568fdc0479aad85b0270d6b5a6509dbc142e2", + "sha256:fc0db32f7223b094964e71729c0361f93db43664dd1ec86d3df217853cedda87", + "sha256:fd4fd83aa912d7b89b4b4a1580d30e2a4242f3936882a3f433586e5ab97ed0d5", + "sha256:feb5db446e96bfecfec078b943cc07744cc759893cef045aa8b8b6d6aaa8274e" + ], + "markers": "python_version >= '3.6'", + "version": "==8.3.2" + }, "pyarrow": { "hashes": [ "sha256:1832709281efefa4f199c639e9f429678286329860188e53beeda71750775923", @@ -211,6 +505,65 @@ ], "version": "==0.4.8" }, + "pycocotools": { + "hashes": [ + "sha256:24717a12799b4471c2e54aa210d642e6cd4028826a1d49fcc2b0e3497e041f1a" + ], + "markers": "platform_system == 'Linux'", + "version": "==2.0.2" + }, + "pycryptodome": { + "hashes": [ + "sha256:014c758af7fa38cab85b357a496b76f4fc9dda1f731eb28358d66fef7ad4a3e1", + "sha256:06162fcfed2f9deee8383fd59eaeabc7b7ffc3af50d3fad4000032deb8f700b0", + "sha256:0ca7a6b4fc1f9fafe990b95c8cda89099797e2cfbf40e55607f2f2f5a3355dcb", + "sha256:2a4bcc8a9977fee0979079cd33a9e9f0d3ddba5660d35ffe874cf84f1dd399d2", + "sha256:3c7ed5b07274535979c730daf5817db5e983ea80b04c22579eee8da4ca3ae4f8", + "sha256:4169ed515742425ff21e4bd3fabbb6994ffb64434472fb72230019bdfa36b939", + "sha256:428096bbf7a77e207f418dfd4d7c284df8ade81d2dc80f010e92753a3e406ad0", + "sha256:4ce6b09547bf2c7cede3a017f79502eaed3e819c13cdb3cb357aea1b004e4cc6", + 
"sha256:53989477044be41fa4a63da09d5038c2a34b2f4554cfea2e3933b17186ee9e19", + "sha256:621a90147a5e255fdc2a0fec2d56626b76b5d72ea9e60164c9a5a8976d45b0c9", + "sha256:6db1f9fa1f52226621905f004278ce7bd90c8f5363ffd5d7ab3755363d98549a", + "sha256:6eda8a3157c91ba60b26a07bedd6c44ab8bda6cd79b6b5ea9744ba62c39b7b1e", + "sha256:75e78360d1dd6d02eb288fd8275bb4d147d6e3f5337935c096d11dba1fa84748", + "sha256:7ff701fc283412e651eaab4319b3cd4eaa0827e94569cd37ee9075d5c05fe655", + "sha256:8f3a60926be78422e662b0d0b18351b426ce27657101c8a50bad80300de6a701", + "sha256:a843350d08c3d22f6c09c2f17f020d8dcfa59496165d7425a3fba0045543dda7", + "sha256:ae29fcd56152f417bfba50a36a56a7a5f9fb74ff80bab98704cac704de6568ab", + "sha256:ae31cb874f6f0cedbed457c6374e7e54d7ed45c1a4e11a65a9c80968da90a650", + "sha256:b33c9b3d1327d821e28e9cc3a6512c14f8b17570ddb4cfb9a52247ed0fcc5d8b", + "sha256:b59bf823cfafde8ef1105d8984f26d1694dff165adb7198b12e3e068d7999b15", + "sha256:bc3c61ff92efdcc14af4a7b81da71d849c9acee51d8fd8ac9841a7620140d6c6", + "sha256:ce81b9c6aaa0f920e2ab05eb2b9f4ccd102e3016b2f37125593b16a83a4b0cc2", + "sha256:d7e5f6f692421e5219aa3b545eb0cffd832cd589a4b9dcd4a5eb4260e2c0d68a", + "sha256:da796e9221dda61a0019d01742337eb8a322de8598b678a4344ca0a436380315", + "sha256:ead516e03dfe062aefeafe4a29445a6449b0fc43bc8cb30194b2754917a63798", + "sha256:ed45ef92d21db33685b789de2c015e9d9a18a74760a8df1fc152faee88cdf741", + "sha256:f19edd42368e9057c39492947bb99570dc927123e210008f2af7cf9b505c6892", + "sha256:f9bad2220b80b4ed74f089db012ab5ab5419143a33fad6c8aedcc2a9341eac70", + "sha256:fce7e22d96030b35345637c563246c24d4513bd3b413e1c40293114837ab8912", + "sha256:ffd0cac13ff41f2d15ed39dc6ba1d2ad88dd2905d656c33d8235852f5d6151fd" + ], + "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4'", + "version": "==3.11.0" + }, + "pyparsing": { + "hashes": [ + "sha256:c203ec8783bf771a155b207279b9bccb8dea02d8f0c9e5f8ead507bc3246ecc1", + 
"sha256:ef9d7589ef3c200abe66653d3f1ab1033c3c419ae9b9bdb1240a85b024efc88b" + ], + "markers": "python_version >= '2.6' and python_version not in '3.0, 3.1, 3.2, 3.3'", + "version": "==2.4.7" + }, + "pysocks": { + "hashes": [ + "sha256:08e69f092cc6dbe92a0fdd16eeb9b9ffbc13cadfe5ca4c7bd92ffb078b293299", + "sha256:2725bd0a9925919b9b51739eea5f9e2bae91e83288108a9ad338b2e3a4435ee5", + "sha256:3f8804571ebe159c380ac6de37643bb4685970655d3bba243530d6558b799aa0" + ], + "version": "==1.7.1" + }, "python-dateutil": { "hashes": [ "sha256:0123cacc1627ae19ddf3c27a5de5bd67ee4586fbdd6440d9748f8abb483d3e86", @@ -221,11 +574,11 @@ }, "python-dotenv": { "hashes": [ - "sha256:aae25dc1ebe97c420f50b81fb0e5c949659af713f31fdb63c749ca68748f34b1", - "sha256:f521bc2ac9a8e03c736f62911605c5d83970021e3fa95b37d769e2bbbe9b6172" + "sha256:14f8185cc8d494662683e6914addcb7e95374771e707601dfc70166946b4c4b8", + "sha256:bbd3da593fc49c249397cbfbcc449cf36cb02e75afc8157fcc6a81df6fb7750a" ], "index": "pypi", - "version": "==0.19.0" + "version": "==0.19.1" }, "python-levenshtein": { "hashes": [ @@ -277,6 +630,9 @@ "version": "==5.4.1" }, "requests": { + "extras": [ + "socks" + ], "hashes": [ "sha256:6c1246513ecd5ecd4528a0906f910e8f0f9c6b8ec72030dc9fd154dc1a6efd24", "sha256:b8aa58f8cf793ffd8782d3d8cb19e66ef36f7aba4353eec859e74678b01b07a7" @@ -312,6 +668,64 @@ "editable": true, "path": "." 
}, + "tabula-py": { + "hashes": [ + "sha256:784c37a9a46bc8b928cf31cef1d7ed1c9db8af19fb6bb1e63a481ecda0d169d1", + "sha256:9da61aa5d4256f79e7fa64d1fb09956d4c104d1a0116566c43bf9f612f37c149" + ], + "index": "pypi", + "version": "==2.3.0" + }, + "terminaltables": { + "hashes": [ + "sha256:f3eb0eb92e3833972ac36796293ca0906e998dc3be91fbe1f8615b331b853b81" + ], + "version": "==3.1.0" + }, + "torch": { + "hashes": [ + "sha256:06435080ba0a2c8f88b65af0550b973c5aa7771eacd9b17f69057fc7436a8ae2", + "sha256:1fb49ca0ca8edefbb3f47f6801482144c3a746ec21a65eb3f0839a1d8fb24705", + "sha256:335961a5c893f7b33b29aecbc19382a1a1b0106b3457a1c45148e1e14f8f5e09", + "sha256:351dda9f483486bec66ed838234e96f077e6886c88110bb1e2f4a708ed2356ce", + "sha256:35ec703bc535bde7e8790ab9500f02d4413d995ac981520501fde95e268781e1", + "sha256:42ca081a2e0e759844e70cad7efd8fcfb2f81634dffa73a226564eb83d989e5b", + "sha256:54dacb6a3f63c54334fadbf22fb6e9ee865085a4e0368962edff5babda057606", + "sha256:936d303c5e1d60259fb71d95a33e84d84fececa25a0fae112f6a23286ff183c8", + "sha256:a198332e2d344d25e423ae2df98d56d83060f19e9f4cf23164dffc8d403efeb8", + "sha256:b92f934b3c95578b3fd37cc06afca208d63f02b0d01b806e979cb4e46124a7f8", + "sha256:dd3ca91dc1a9fe3fbcddf035cb2fb8be44d57a527b845cd196ba69249adecccf", + "sha256:e470697006a4c08e4fb6a645e8ca49b0d36c8e7ccf413deef5161335bd7399f1" + ], + "index": "pypi", + "version": "==1.9.1" + }, + "torchvision": { + "hashes": [ + "sha256:1c186f42b4f8aa9a01c56c3a758693b0447aa169afb9fba0051177f8fecbd691", + "sha256:453e935212193e89b4bbb8d51082d8138631c2f8a420390284b1946d893df6eb", + "sha256:46a70a30ea7aeab63e67504778f2565fbb1c153fdd8e1a8c6a22193aec4dbddd", + "sha256:4ebffeee5468a0934952030eaba1de1dbb08154132235ee1d9049e41dfb1600d", + "sha256:6c8fe90213be4bce590ac9647b34db022d5d1ae94f309a733b9a64e65232173a", + "sha256:99d3e01e1d67d12bcc88e826431b70cad5b8e4729a277c04601f83358a120508", + "sha256:ac8dfbe4933013dda898b815e2476ebbc35e3a16b9352dfdd66e773c77755bec", + 
"sha256:bc99a984b162ee5626787eaee885d9fec1a5f16837f9d0c8223cca3269b9e47d", + "sha256:cd7e2b1a89d5a08f24325fc12441f5ba2822f407489377ac7841bf351a1f4d37", + "sha256:d6420bf21b9d0bdbabe55d64c8b11c61f8eb077948a55d5707946fcb17d97cec", + "sha256:d7c2d6c20244404fc9ca3568c88c305cb5a81d526d5912d52d22c64999bd4353", + "sha256:e504d9d51eae60a98925aee4a3fd58655abd5669659ad7431f7791a93af166fc" + ], + "index": "pypi", + "version": "==0.10.1" + }, + "tqdm": { + "hashes": [ + "sha256:8dd278a422499cd6b727e6ae4061c40b48fce8b76d1ccbf5d34fca9b7f925b0c", + "sha256:d359de7217506c9851b7869f3708d8ee53ed70a1b8edbba4dbcb47442592920d" + ], + "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'", + "version": "==4.62.3" + }, "trino": { "hashes": [ "sha256:67398bacffbcfbcbb8217769467f05c32eadd688c9aea6e301c1e2ba9be0052d", @@ -320,6 +734,14 @@ "index": "pypi", "version": "==0.306.0" }, + "typing-extensions": { + "hashes": [ + "sha256:49f75d16ff11f1cd258e1b988ccff82a3ca5570217d7ad8c5f48205dd99a677e", + "sha256:d8226d10bc02a29bcc81df19a26e56a9647f8b0a6d4a83924139f4a8b01f17b7", + "sha256:f1d25edafde516b146ecd0613dabcc61409817af4766fbbcfb8d1ad4ec441a34" + ], + "version": "==3.10.0.2" + }, "urllib3": { "hashes": [ "sha256:4987c65554f7a2dbf30c18fd48778ef124af6fab771a377103da0585e2336ece", @@ -327,6 +749,13 @@ ], "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4' and python_version < '4'", "version": "==1.26.7" + }, + "yapf": { + "hashes": [ + "sha256:408fb9a2b254c302f49db83c59f9aa0b4b0fd0ec25be3a5c51181327922ff63d", + "sha256:e3a234ba8455fe201eaa649cdac872d590089a18b661e39bbac7020978dd9c2e" + ], + "version": "==0.31.0" } }, "develop": { @@ -339,11 +768,11 @@ }, "anyio": { "hashes": [ - "sha256:0b993a2ef6c1dc456815c2b5ca2819f382f20af98087cc2090a4afed3a501436", - "sha256:c32da314c510b34a862f5afeaf8a446ffed2c2fde21583e654bd71ecfb5b744b" + "sha256:56ceaeed2877723578b1341f4f68c29081db189cfb40a97d1922b9513f6d7db6", + 
"sha256:8eccec339cb4a856c94a75d50fc1d451faf32a05ef406be462e2efc59c9838b0" ], "markers": "python_full_version >= '3.6.2'", - "version": "==3.3.2" + "version": "==3.3.3" }, "argon2-cffi": { "hashes": [ @@ -395,10 +824,10 @@ }, "certifi": { "hashes": [ - "sha256:2bbf76fd432960138b3ef6dda3dde0544f27cbf8546c458e60baf371917ba9ee", - "sha256:50b1e4f8446b06f41be7dd6338db18e0990601dce795c2b1686458aa7e8fa7d8" + "sha256:78884e7c1d4b00ce3cea67b44566851c4343c120abd683433ce934a68ea58872", + "sha256:d62a0163eb4c2344ac042ab2bdf75399a71a2d8c7d47eac2e2ee91b9d6339569" ], - "version": "==2021.5.30" + "version": "==2021.10.8" }, "cffi": { "hashes": [ @@ -460,68 +889,69 @@ }, "coverage": { "hashes": [ - "sha256:08fd55d2e00dac4c18a2fa26281076035ec86e764acdc198b9185ce749ada58f", - "sha256:11ce082eb0f7c2bbfe96f6c8bcc3a339daac57de4dc0f3186069ec5c58da911c", - "sha256:17983f6ccc47f4864fd16d20ff677782b23d1207bf222d10e4d676e4636b0872", - "sha256:25df2bc53a954ba2ccf230fa274d1de341f6aa633d857d75e5731365f7181749", - "sha256:274a612f67f931307706b60700f1e4cf80e1d79dff6c282fc9301e4565e78724", - "sha256:3dfb23cc180b674a11a559183dff9655beb9da03088f3fe3c4f3a6d200c86f05", - "sha256:43bada49697a62ffa0283c7f01bbc76aac562c37d4bb6c45d56dd008d841194e", - "sha256:4865dc4a7a566147cbdc2b2f033a6cccc99a7dcc89995137765c384f6c73110b", - "sha256:581fddd2f883379bd5af51da9233e0396b6519f3d3eeae4fb88867473be6d56e", - "sha256:5c191e01b23e760338f19d8ba2470c0dad44c8b45e41ac043b2db84efc62f695", - "sha256:6e216e4021c934246c308fd3e0d739d9fa8a3f4ea414f584ab90ef9c1592f282", - "sha256:72f8c99f1527c5a8ee77c890ea810e26b39fd0b4c2dffc062e20a05b2cca60ef", - "sha256:7593a49300489d064ebb6c58539f52cbbc4a2e6a4385de5e92cae1563f88a425", - "sha256:7844a8c6a0fee401edbf578713c2473e020759267c40261b294036f9d3eb6a2d", - "sha256:7af2f8e7bb54ace984de790e897f858e88068d8fbc46c9490b7c19c59cf51822", - "sha256:7dbda34e8e26bd86606ba8a9c13ccb114802e01758a3d0a75652ffc59a573220", - "sha256:82b58d37c47d93a171be9b5744bcc96a0012cbf53d5622b29a49e6be2097edd7", - 
"sha256:8305e14112efb74d0b5fec4df6e41cafde615c2392a7e51c84013cafe945842c", - "sha256:8426fec5ad5a6e8217921716b504e9b6e1166dc147e8443b4855e329db686282", - "sha256:88f1810eb942e7063d051d87aaaa113eb5fd5a7fd2cda03a972de57695b8bb1a", - "sha256:8da0c4a26a831b392deaba5fdd0cd7838d173b47ce2ec3d0f37be630cb09ef6e", - "sha256:a9dbfcbc56d8de5580483cf2caff6a59c64d3e88836cbe5fb5c20c05c29a8808", - "sha256:aa5d4d43fa18cc9d0c6e02a83de0b9729b5451a9066574bd276481474f0a53ab", - "sha256:adb0f4c3c8ba8104378518a1954cbf3d891a22c13fd0e0bf135391835f44f288", - "sha256:b4ee5815c776dfa3958ba71c7cd4cdd8eb40d79358a18352feb19562fe4408c4", - "sha256:b5dd5ae0a9cd55d71f1335c331e9625382239b8cede818fb62d8d2702336dbf8", - "sha256:b78dd3eeb8f5ff26d2113c41836bac04a9ea91be54c346826b54a373133c8c53", - "sha256:bea681309bdd88dd1283a8ba834632c43da376d9bce05820826090aad80c0126", - "sha256:befb5ffa9faabef6dadc42622c73de168001425258f0b7e402a2934574e7a04b", - "sha256:d795a2c92fe8cb31f6e9cd627ee4f39b64eb66bf47d89d8fcf7cb3d17031c887", - "sha256:d82cbef1220703ce56822be7fbddb40736fc1a928ac893472df8aff7421ae0aa", - "sha256:e63490e8a6675cee7a71393ee074586f7eeaf0e9341afd006c5d6f7eec7c16d7", - "sha256:e735ab8547d8a1fe8e58dd765d6f27ac539b395f52160d767b7189f379f9be7a", - "sha256:fa816e97cfe1f691423078dffa39a18106c176f28008db017b3ce3e947c34aa5", - "sha256:fff04bfefb879edcf616f1ce5ea6f4a693b5976bdc5e163f8464f349c25b59f0" + "sha256:07efe1fbd72e67df026ad5109bcd216acbbd4a29d5208b3dab61779bae6b7b26", + "sha256:0898d6948b31df13391cd40568de8f35fa5901bc922c5ae05cf070587cb9c666", + "sha256:0a7e55cc9f7efa22d5cc9966276ec7a40a8803676f6ccbfdc06a486fba9aa9ee", + "sha256:17426808e8e0824f864876312d41961223bf5e503bf8f1f846735279a60ea345", + "sha256:1770d24f45f1f2daeae34cfa3b33fcb29702153544cd2ad40d58399dd4ff53b5", + "sha256:1864bdf9b2ccb43e724051bc23a1c558daf101ad4488ede1945f2a8be1facdad", + "sha256:2c5f39d1556e75fc3c4fb071f9e7cfa618895a999a0de763a541d730775d0d5f", + "sha256:3490ff6dbf3f7accf0750136ed60ae1f487bccc1f097740e3b21262bc9c89854", 
+ "sha256:353a50f123f0185cdb7a1e1e3e2cfb9d1fd7e293cfaf68eedaf5bd8e02e3ec32", + "sha256:3edbb3ec580c73e5a264f5d04f30245bc98eff1a26765d46c5c65134f0a0e2f7", + "sha256:4eb9cd910ca8e243f930243a9940ea1a522e32435d15668445753d087c30ee12", + "sha256:5b06f4f1729e2963281d9cd6e65e6976bf27b44d4c07ac5b47223ce45f822cec", + "sha256:5b1ceacb86e0a9558061dcc6baae865ed25933ea57effea644f21657cdce19bc", + "sha256:65da6e3e8325291f012921bbf71fea0a97824e1c573981871096aac6e2cf0ec5", + "sha256:66fe33e9e0df58675e08e83fe257f89e7f625e7633ea93d0872154e09cce2724", + "sha256:6873f3f954d3e3ab8b1881f4e5307cc19f70c9f931c41048d9f7e6fd946eabe7", + "sha256:73880a80fad0597eca43e213e5e1711bf6c0fcdb7eb6b01b3b17841ebe5a7f8d", + "sha256:7600fac458f74c68b097379f76f3a6e3a630493fc7fc94b6508fedd9d498c194", + "sha256:83682b73785d2e078e0b5f63410b8125b122e1a22422640c57edd4011c950f3e", + "sha256:83faa3692e8306b20293889714fdf573d10ef5efc5843bd7c7aea6971487bd6a", + "sha256:9c416ba03844608f45661a5b48dc59c6b5e89956efe388564dd138ca8caf540b", + "sha256:9d242a2434801ef5125330deddb4cddba8990c9a49b3dec99dca17dd7eefba5a", + "sha256:a2e15ab5afbee34abf716fece80ea33ea09a82e7450512f022723b1a82ec9a4e", + "sha256:abe8207dfb8a61ded9cd830d26c1073c8218fc0ae17eb899cfe8ec0fafae6e22", + "sha256:ad7182a82843f9f85487f44567c8c688f16c906bdb8d0e44ae462aed61cb8f1b", + "sha256:b45f89a8ef65c29195f8f28dbe215f44ccb29d934f3e862d2a5c12e38698a793", + "sha256:b81a4e667c45b13658b84f9b8f1d32ef86d5405fabcbd181b76b9e51d295f397", + "sha256:c9c413c4397d4cdc7ca89286158d240ce524f9667b52c9a64dd7e13d16cf8815", + "sha256:e11cca9eb5c9b3eaad899728ee2ce916138399ee8cbbccaadc1871fecb750827", + "sha256:e66c50f0ab445fec920a9f084914ea1776a809e3016c3738519048195f851bbb", + "sha256:ea452a2d83964d08232ade470091015e7ab9b8f53acbec10f2210fbab4ce7e43", + "sha256:f398d38e6ebc2637863db1d7be3d4f9c5174e7d24bb3b0716cdb1f204669cbcf", + "sha256:f82a17f2a77958f3eef40ad385fc82d4c6ba9a77a51a174efe03ce75daebbc16" ], "index": "pypi", - "version": "==6.0" + "version": "==6.0.1" }, 
"debugpy": { "hashes": [ - "sha256:0c523fcbb6fb395403ee8508853767b74949335d5cdacc9f83d350670c2c0db2", - "sha256:135a77ac1a8f6ea49a69928f088967d36842bc492d89b45941c6b19222cffa42", - "sha256:2019ffcd08d7e643c644cd64bee0fd53c730cb8f15ff37e6a320b5afd3785bfa", - "sha256:3e4de96c70f3398abd1777f048b47564d98a40df1f72d33b47ef5b9478e07206", - "sha256:4d53fe5aecf03ba466aa7fa7474c2b2fe28b2a6c0d36688d1e29382bfe88dd5f", - "sha256:5ded60b402f83df46dee3f25ae5851809937176afdafd3fdbaab60b633b77cad", - "sha256:7c15014290150b76f0311debf7fbba2e934680572ea60750b0f048143e873b3e", - "sha256:7e7210a3721fc54b52d8dc2f325e7c937ffcbba02b808e2e3215dcbf0c0b8349", - "sha256:847926f78c1e33f7318a743837adb6a9b360a825b558fd21f9240ba518fe1bb1", - "sha256:88b17d7c2130968f75bdc706a33f46a8a6bb90f09512ea3bd984659d446ee4f4", - "sha256:8d488356cc66172f1ea29635fd148ad131f13fad0e368ae03cc5c0a402372756", - "sha256:ab3f33499c597a2ce454b81088e7f9d56127686e003c4f7a1c97ad4b38a55404", - "sha256:c0fd1a66e104752f86ca2faa6a0194dae61442a768f85369fc3d11bacff8120f", - "sha256:c3d7db37b7eb234e49f50ba22b3b1637e8daadd68985d9cd35a6152aa10faa75", - "sha256:c9665e58b80d839ae1b0815341c63d00cae557c018f198c0b6b7bc5de9eca144", - "sha256:dbda8f877c3dec1559c01c63a1de63969e51a4907dc308f4824238bb776026fe", - "sha256:f3dcc294f3b4d79fdd7ffe1350d5d1e3cc29acaec67dd1c43143a43305bbbc91", - "sha256:f907941ad7a460646773eb3baae4c88836e9256b390dfbfae8d92a3d3b849a7d" + "sha256:098753d30232d1e4264eee37e1ddd5d106dc5c4bc6d8d7f4dadad9e44736cd48", + "sha256:1283e418f595262d11abc5fae6a3ac629c5fc3b44d3988511ea755414aab3062", + "sha256:33e8a9b4949be8b4f5fcfff07e24bd63c565060659f1c79773c08d19eee012f2", + "sha256:72093ea83226d5264b3697b948c07a3cfcc4953da14a78a50c4e623a2bb99ad8", + "sha256:77b5233b23a248cd930bf03ecd684da065c6e7d2a57d137516b6fa1698a58317", + "sha256:82c4fa1293981a28c435d196a3714e06df761daff0da3336234475ceff1b042c", + "sha256:86febd61fc351cee926060eef008e242b7259957d71d25eef82860d0cc59b4dc", + 
"sha256:8e7391a08a351adce6e5154ed35e4cf90c5f3c10dbf7c8f6a234faef300588d6", + "sha256:990228f15de4ccbc52c2accf41a63b3b8d0a01e3de9876e02e77e487c4b1ffab", + "sha256:9f3bed64027bd80a8fe1f35491ec0ec2d2c85f1e63dac7c0311e400bfe58cf05", + "sha256:a03051ba4fdf6720ee83a42e9f803e3a0b69a48b00436b97d16aeda49d28a8bf", + "sha256:be7ca2baef5a634dfbd086d9c1d6b5e0783c6d0f6d0a004b43d36f625d4fc0a9", + "sha256:c3184666cfe1768bf110f8075bafea59d2afce3cc54f4c501f2371c7238bc69d", + "sha256:cdaf6baaf8176644e752aed321b3f810dcf8b0439709f7edd9ae542f849a639b", + "sha256:ce0794d50391c87813bb148548c34dc638fb4d58198d275334968f63c088aa69", + "sha256:dacdb0a3377063d638bd8736c80b7274ae341ce778fec0f883ef1cbb79538bf2", + "sha256:dd0e8d5e099444c22b27511dafd48e8bdcd7051b811ddd0ab2062965fe36ac80", + "sha256:de56775b3dbbfc02bc9fb0682da4a960e0a5bada699eac5e22e0723c4107ec9f", + "sha256:ef71eb8eb276370f8e74ab3f8c7648bbdc9aabac814a5b2840c8dd38a7bc7251", + "sha256:f058c204341fd7ff800ee0edafc106ca0fb1c9857e8a8895a6e04cca3ddcb7bf", + "sha256:fda623aa1036b34d554a1225a09cae6bf02b06c0ad903a9f0b8ac3cb74eddc15" ], "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4'", - "version": "==1.4.3" + "version": "==1.5.0" }, "decorator": { "hashes": [ @@ -558,11 +988,11 @@ }, "flake8": { "hashes": [ - "sha256:07528381786f2a6237b061f6e96610a4167b226cb926e2aa2b6b1d78057c576b", - "sha256:bf8fd333346d844f616e8d47905ef3a3384edae6b4e9beb0c5101e25e3110907" + "sha256:479b1304f72536a55948cb40a32dce8bb0ffe3501e26eaf292c7e60eb5e0428d", + "sha256:806e034dda44114815e23c16ef92f95c91e4c71100ff52813adf7132a6ad870d" ], "index": "pypi", - "version": "==3.9.2" + "version": "==4.0.1" }, "idna": { "hashes": [ @@ -613,11 +1043,11 @@ }, "jinja2": { "hashes": [ - "sha256:1f06f2da51e7b56b8f238affdd6b4e2c61e39598a378cc49345bc1bd42a978a4", - "sha256:703f484b47a6af502e743c9122595cc812b0271f661722403114f71a79d0f5a4" + "sha256:827a0e32839ab1600d4eb1c4c33ec5a8edfbc5cb42dafa13b81f182f97784b45", + 
"sha256:8569982d3f0889eed11dd620c706d39b60c36d6d25843961f33f77fb6bc6b20c" ], "markers": "python_version >= '3.6'", - "version": "==3.0.1" + "version": "==3.0.2" }, "json5": { "hashes": [ @@ -628,19 +1058,19 @@ }, "jsonschema": { "hashes": [ - "sha256:48f4e74f8bec0c2f75e9fcfffa264e78342873e1b57e2cfeae54864cc5e9e4dd", - "sha256:9938802041347f2c62cad2aef59e9a0826cd34584f3609db950efacb4dbf6518" + "sha256:2b3cca28580511d44326f0e7fc582eab3cbe31aabd1a1c2cfa74a399796ffd84", + "sha256:9dd7c33b4a96138dc37bb86b3610d3b12d30d96433d4d73435ca3025804154a8" ], "markers": "python_version >= '3.7'", - "version": "==4.0.1" + "version": "==4.1.0" }, "jupyter-client": { "hashes": [ - "sha256:124a6e6979c38999d9153b1c4d1808c4c820a45066d5ed1857a5b59c04ffccb3", - "sha256:382aca66dcaf96d7eaaa6c546d57cdf8b3b1cf5bc1f2704c58a1d8d244f1163d" + "sha256:074bdeb1ffaef4a3095468ee16313938cfdc48fc65ca95cc18980b956c2e5d79", + "sha256:8b6e06000eb9399775e0a55c52df6c1be4766666209c22f90c2691ded0e338dc" ], "markers": "python_full_version >= '3.6.1'", - "version": "==7.0.5" + "version": "==7.0.6" }, "jupyter-core": { "hashes": [ @@ -652,19 +1082,19 @@ }, "jupyter-server": { "hashes": [ - "sha256:827c134da7a9e09136c2dc2fd16743350970105247f085abfc6ce0432d0c979e", - "sha256:8ab4f484a4a2698f757cff0769d27b5d991e0232a666d54f4d6ada4e6a61330b" + "sha256:618aba127b1ff35f50e274b6055dfeff006a6008e94d4e9511c251a2d99131e5", + "sha256:ab7ab1cc38512f15026cbcbb96300fb46ec8b24aa162263d9edd00e0a749b1e8" ], "markers": "python_version >= '3.6'", - "version": "==1.11.0" + "version": "==1.11.1" }, "jupyterlab": { "hashes": [ - "sha256:1241ff4ab8604a281eda5d8215fe59e418737edcdfe71df09a0bd5fdd4ccfd2c", - "sha256:13174cb6076dd5da6f1b85725ccfcc9518d8f98e86b8b644fc89b1dfaeda63a9" + "sha256:3bedbc732ae86b616bd5c7855a6d071fe76ad47186378d36df77f4fc58ae322a", + "sha256:a43733acc3729557fc4758cff55652e52896e42c64c1f12540656ae7f298b806" ], "index": "pypi", - "version": "==3.1.14" + "version": "==3.1.18" }, "jupyterlab-pygments": { "hashes": [ 
@@ -876,11 +1306,11 @@ }, "pycodestyle": { "hashes": [ - "sha256:514f76d918fcc0b55c6680472f0a37970994e07bbb80725808c17089be302068", - "sha256:c389c1d06bf7904078ca03399a4816f974a1d590090fecea0c63ec26ebaf1cef" + "sha256:720f8b39dde8b293825e7ff02c475f3077124006db4f440dcbc9a20b76548a20", + "sha256:eddd5847ef438ea1c7870ca7eb78a9d47ce0cdb4851a5523949f2601d0cbbe7f" ], - "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'", - "version": "==2.7.0" + "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3, 3.4'", + "version": "==2.8.0" }, "pycparser": { "hashes": [ @@ -892,11 +1322,11 @@ }, "pyflakes": { "hashes": [ - "sha256:7893783d01b8a89811dd72d7dfd4d84ff098e5eed95cfa8905b22bbffe52efc3", - "sha256:f5bc8ecabc05bb9d291eb5203d6810b49040f6ff446a756326104746cc00c1db" + "sha256:05a85c2872edf37a4ed30b0cce2f6093e1d0581f8c19d7393122da7e25b2b24c", + "sha256:3bb3a3f256f4b7968c9c788781e4ff07dce46bdf12339dcda61053375426ee2e" ], "markers": "python_version >= '2.7' and python_version not in '3.0, 3.1, 3.2, 3.3'", - "version": "==2.3.1" + "version": "==2.4.0" }, "pygments": { "hashes": [ @@ -1000,6 +1430,9 @@ "version": "==22.3.0" }, "requests": { + "extras": [ + "socks" + ], "hashes": [ "sha256:6c1246513ecd5ecd4528a0906f910e8f0f9c6b8ec72030dc9fd154dc1a6efd24", "sha256:b8aa58f8cf793ffd8782d3d8cb19e66ef36f7aba4353eec859e74678b01b07a7" diff --git a/data/annotations/ESG/20201030 1Qbit aggregated_annotations_needs_correction.xlsx b/data/annotations/ESG/20201030 1Qbit aggregated_annotations_needs_correction.xlsx new file mode 100755 index 0000000..de5c0a2 Binary files /dev/null and b/data/annotations/ESG/20201030 1Qbit aggregated_annotations_needs_correction.xlsx differ diff --git a/data/extraction/esg_TEXT_dataset.csv b/data/extraction/esg_TEXT_dataset.csv new file mode 100644 index 0000000..8109988 --- /dev/null +++ b/data/extraction/esg_TEXT_dataset.csv @@ -0,0 +1,665 @@ 
+,question,context,company,source_file,source_page,kpi_id,year,answer,data_type,relevant_paragraphs,annotator,label +0,What is the company name?, Enova is a state enterprise owned by the Ministry of Climate and ,Cabot Oil & Gas Corp,Cabot Oil & Gas Corp Annual Report 2018.pdf,[3],0.0,2018,Cabot Oil & Gas Corporation,TEXT,"[""Cabot Oil & Gas Corporation, headquartered in Houston, Texas, is an independent oil and gas producer. The Company's focused operations are centered around developing its natural gas resources in northeast Pennsylvania.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +1,What is the company name?, IPCC (2018): Global Warming of 1.5 C IPCC (2019): Climate Change and Land IPCC (2019): Special Report on the Ocean and Cryosphere in a Changing Climate,OMV,Sustainability Report 2014_EN.pdf,[77],0.0,2014,OMV Aktiengesellschaft,TEXT,"[""Owner and publisher OMV Aktiengesellschaft Head Office Trabrennstraße 6-8 1020 Vienna, Austria info.sustainability@omv.com""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +2,What is the company name?,1 The US national hydraulic fracturing chemical registry.,Lundin Energy AB,ar_2019_e.pdf,[1],0.0,2019,Lundin Petroleum,TEXT,"[""Lundin Petroleum ""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +3,What is the company name?,2019 Serious incident frequency (SIF - per million hours worked),"Aktsionernoe Obshchestvo Rosneftegaz, Moscow",annual 2015.pdf,[1],0.0,2015,Rosneft,TEXT,"[""ROSNEFT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +4,What is the company name?,"A Delaware corporation formed in 1971 and publicly held since 1988, Devon (NYSE: DVN) is an independent energy company engaged primarily in the exploration, development and production of oil, natural gas and NGLs. Our operations are concentrated in various North American onshore areas in the U.S. and Canada. 
In July 2018, we exited the midstream business by divesting our aggregate ownership interests in EnLink and the General Partner.",Devon,NYSE_DVN_2018.pdf,[6],0.0,2018,Devon,TEXT,"[""A Delaware corporation formed in 1971 and publicly held since 1988, Devon (NYSE: DVN) is an +independent energy company engaged primarily in the exploration, development and production of oil, natural gas +and NGLs. Our operations are concentrated in various North American onshore areas in the U.S. and Canada. In +July 2018, we exited the midstream business by divesting our aggregate ownership interests in EnLink and the +General Partner.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +5,What is the company name?,"A key player in the energy transition, EDF group is an integrated energy company, active in all areas of the business: generation, transmission, distribution, trading, energy supply and energy services. As a global leader in low-carbon energy, the Group has developed a diversified generation mix based on nuclear power, thermal energy, hydropower and other renewable energies.",EDF,EDF-ddr-2018-en.pdf,[3],0.0,2018,EDF Group,TEXT,"[""A key player in the energy transition, EDF group is an integrated energy company, active in all areas of the business: generation, transmission, distribution, trading, energy supply and energy services. As a global leader in low-carbon energy, the Group has developed a diversified generation mix based on nuclear power, thermal energy, hydropower and other renewable energies.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +6,What is the company name?,"A particular challenge is the invasive sun coral, which is currently spreading along the Brazilian coastline and competing with native coral species. 
To control the presence of this invasive species in the Peregrino field, a risk tool has been developed to assess the potential of vessels operating in the field spreading corals, so that relevant mitigating actions can be taken. ",Ameren Corporation,Ameren Corporation Climate Risk Report 2019.pdf,[1],0.0,2019,Ameren,TEXT,"[""Ameren""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +7,What is the company name?,AKER BP ASA,Aker BP,AKERBP-Annual-Report-2017.pdf,[1],0.0,2017,Aker BP,TEXT,"[""AKER BP ASA""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +8,What is the company name?,About the Company NOVATEK is one of the largest independent natural gas producers in Russia,NOVATEK,04_NOVATEK_AR_2016_ENG_11.pdf,[3],0.0,2016,NOVATEK,TEXT,"[""About the Company NOVATEK is one of the largest independent natural gas producers in Russia""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +9,What is the company name?,"About this report This report covers the operations of OMV Group, headquartered in Vienna, Austria, for the 2016 business year.",OMV,Sustainability Report 2016_EN.pdf,[2],0.0,2016,OMV Group,TEXT,"[""About this report This report covers the operations of OMV Group, headquartered in Vienna, Austria, for the 2016 business year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +10,What is the company name?,"About this report This report covers the operations of OMV Group, headquartered in Vienna, Austria, for the 2017 business year.",OMV,Sustainability Report 2017_EN.pdf,[2],0.0,2017,OMV Group,TEXT,"[""About this report This report covers the operations of OMV Group, headquartered in Vienna, Austria, for the 2017 business year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +11,What is the company name?,"About this report This report covers the sustainability operations of OMV Group, headquartered in Vienna, Austria, for the 2015 business year.",OMV,Sustainability Report 
2015_EN.pdf,[2],0.0,2015,OMV Group,TEXT,"[""About this report This report covers the sustainability operations of OMV Group, headquartered in Vienna, Austria, for the 2015 business year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +12,What is the company name?,"Actions to improve safety and security In 2019, safety initiatives were implemented through the company-wide improvement project: Safety beyond 2020. The goal has been to further strengthen the safety culture and performance through risk awareness and proactive behaviour at all organisational levels. The project builds on the existing I am Safety governance, which highlights that individuals are personally accountable for safety. Four main areas for improvement have been identified: safety visibility, leadership and behaviour, safety indicators and learning and follow-up.",University of Portsmouth,University of Plymouth Sustainability_Report_2018.pdf,[3],0.0,2018,University of Plymouth,TEXT,"[""Welcome to the University of Plymouth's fifth Sustainability Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +13,What is the company name?,Adani Enterprises Limited,Adani,Adani Group Adani Enterprises Annual Report 2019.pdf,[1],0.0,2018-19,Adani Enterprises Limited,TEXT,"[""Adani Enterprises Limited""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +14,What is the company name?,Adani Power Limited,Adani,Adani Group Adani Power Annual Report 2019.pdf,[1],0.0,2018-19,Adani Power Limited,TEXT,"[""Adani Power Limited""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +15,What is the company name?,"Additional information, including information on factors that may affect Equinor’s business, is contained in Equinor’s latest Annual Report and Form 20-F, filed with the U.S. 
Securities and Exchange Commission (and section Risk review – Risk factors thereof), which is available at Equinor’s website (www.equinor.com).",Dominion Energy,2018-summary-annual-report.pdf,[8],0.0,2018,Dominion Energy,TEXT,"[""For longer than a century, our stakeholders have relied on Dominion +Energy to provide stability in a changing world. By living our core +values ""” as they are embedded in our corporate culture ""” we have +provided safe, reliable and affordable energy to meet the needs +of our customers and communities, as well as the expectations of +our investors.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +16,What is the company name?,Aker BP,Aker BP,Aker-BP-Annual-report-2018.pdf,[1],0.0,2018,Aker BP,TEXT,"[""Aker BP""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +17,What is the company name?,AkerBP,Aker BP,AKERBP-Annual-Report-2016.pdf,[1],0.0,2016,Aker BP,TEXT,"[""AkerBP""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +18,What is the company name?,Always safe - Responsible operations Always safe - Responsible operations,RWE,RWE-csr_overall-report-2019.pdf,[26],0.0,2019,RWE AG,TEXT,"[""The CR Report of RWE AG is published as a GRI Report and conforms with the GRI Standards (2016) of the Global Reporting Initiative in a selection based on a Materiality Analysis of the topics relevant for our business.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +19,What is the company name?,Always safe Responsible operations Safety is our first priority ,BP,bp-annual-report-and-form-20f-2019.pdf,[1],0.0,2019,BP,TEXT,"[""BP Annual Report and Form 20-F 2019""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +20,What is the company name?,Ameren,Ameren Corporation,Ameren_2019_Annual_Report.pdf,[1],0.0,2019,Ameren,TEXT,"[""Ameren""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +21,What is the company name?,"Annual Report and Form 20-F for the year ended 
December 31, 2018, Royal Dutch Shell plc",Royal Dutch Shell plc,shell_annual_report_2018.pdf,[1],0.0,2018,Royal Dutch Shell plc,TEXT,"[""Annual Report and Form 20-F for the year ended December 31, 2018, Royal Dutch Shell plc""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +22,What is the company name?,"Anti-bribery and corruption - Our Code of Conduct explicitly prohibits engaging in bribery and corruption in any form. Equinor’s Anti-Corruption Compliance Program summarises the standards, requirements and procedures implemented to comply with applicable laws and regulations and maintaining our high ethical standards. Our group-wide policy ensures that anti-bribery and corruption risks are identified, and measures are taken to mitigate risk in all parts of the organisation and that concerns are reported. We maintain a global network of compliance officers responsible for ensuring that ethical and anti- corruption considerations are integrated into Equinor activities no matter where they take place. ",Cenovus Energy,Cenovus Annual Report 2017.pdf,[1],0.0,2017,Cenovus Energy,TEXT,"[""cenovus ENERGY""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +23,What is the company name?,"Approach Resources Inc. is an independent energy company focused on the exploration, development, production and acquisition of unconventional oil and gas reserves in the Midland Basin of the greater Permian Basin in West Texas, where we lease approximately 149,000 net acres as of December 31, 2017. We believe our concentrated acreage position and extensive, integrated field infrastructure system provides us an opportunity to achieve cost, operating and recovery efficiencies in the development of our drilling inventory. Our long-term business strategy is to develop resource potential from the Wolfcamp shale oil formation and pursue acquisitions that meet our strategic and financial objectives. See — Our Business Strategy below. 
Additional drilling targets could include the Clearfork, Canyon Sands, Strawn and Ellenburger zones. We sometimes refer to our development project in the Permian Basin as Project Pangea, which includes Pangea West. Our management and technical team have a proven track record of finding and developing reserves through advanced drilling and completion techniques. As the operator of all of our estimated proved reserves and production, we have a high degree of control over capital expenditures and other operating matters.",Approach Resources Inc,NASDAQ_AREX_2017 annual.pdf,[9],0.0,2017,Approach Resources Inc.,TEXT,"[""Approach Resources Inc. is an independent energy company focused on the exploration, development, +production and acquisition of unconventional oil and gas reserves in the Midland Basin of the greater Permian Basin +in West Texas, where we lease approximately 149,000 net acres as of December 31, 2017. We believe our +concentrated acreage position and extensive, integrated field infrastructure system provides us an opportunity to +achieve cost, operating and recovery efficiencies in the development of our drilling inventory. Our long-term +business strategy is to develop resource potential from the Wolfcamp shale oil formation and pursue acquisitions +that meet our strategic and financial objectives. See “— Our Business Strategy” below. Additional drilling targets +could include the Clearfork, Canyon Sands, Strawn and Ellenburger zones. We sometimes refer to our development +project in the Permian Basin as “Project Pangea,” which includes “Pangea West.” Our management and technical +team have a proven track record of finding and developing reserves through advanced drilling and completion +techniques. 
As the operator of all of our estimated proved reserves and production, we have a high degree of control +over capital expenditures and other operating matters.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +24,What is the company name?,"As I look back on the past two decades, they are largely defined by rapid advancements in technology. From consumer and industrial goods to healthcare and financial services, advancements in technology have reshaped and disrupted industries, while also creating new opportunities for those with the acumen to innovate and successfully execute on a vision. Twenty years ago, in May of 2000, we launched Intercontinental Exchange, a name we chose to reflect our vision of better serving global markets through our innovative, web-based, technology platform. We aspired to create a more transparent market that was easily accessible to all participants. In the years since, our focus on leading technology, customer-driven product innovation and operating efficiency has remained core to our strategy. We have built new technology from scratch; we have acquired old technology and refurbished it; and we have innovated, developing countless new products and content that seamlessly flow through a global distribution platform. It is our operating expertise, leading technology infrastructure and innovative culture that underpin the quality of the networks we operate and, ultimately, have proven to be our most valuable competitive advantages.",Intercontinental Exchange,2019-Annual-Report_Web_BMK_vF.pdf,[2],0.0,2019,Intercontinental Exchange,TEXT,"[""As I look back on the past two decades, they are largely defined by rapid +advancements in technology. From consumer and industrial goods to +healthcare and financial services, advancements in technology have +reshaped and disrupted industries, while also creating new opportunities +for those with the acumen to innovate and successfully execute on a +vision. 
Twenty years ago, in May of 2000, we launched Intercontinental +Exchange, a name we chose to reflect our vision of better serving global +markets through our innovative, web-based, technology platform. We +aspired to create a more transparent market that was easily accessible +to all participants. In the years since, our focus on leading technology, +customer-driven product innovation and operating efficiency has +remained core to our strategy. We have built new technology from +scratch; we have acquired old technology and refurbished it; and we +have innovated, developing countless new products and content that +seamlessly flow through a global distribution platform. It is our +operating expertise, leading technology infrastructure and innovative +culture that underpin the quality of the networks we operate and, +ultimately, have proven to be our most valuable competitive advantages.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +25,What is the company name?,"At Ervia we have a pivotal role to play in enhancing the environment, leading the transition to a low carbon energy system, protecting precious water resources and increasing resilience.",Ervia,Ervia-Annual-Report-2018.pdf,[4],0.0,2018,Ervia,TEXT,"[""At Ervia we have a pivotal role to play +in enhancing the environment, leading +the transition to a low carbon energy +system, protecting precious water +resources and increasing resilience.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +26,What is the company name?,"Australia As part of planning for the Stromlo-1 exploration drilling programme in the Great Australian Bight, a comprehensive Environmental Plan (EP) was finalised and submitted to the authorities in 2019. The EP, which took two years to develop, was accepted by the regulator in December 2019. The work included co-funding extensive baseline surveying of the deep-water environments and the met-ocean conditions of the Great Australian Bight. 
More information about the EP and related engagement activities is found in the Respecting human rights chapter in this report and on our web-site. ",OMV,dload_Sustainability Report 2018_en.pdf,[2],0.0,2018,OMV,TEXT,"[""Welcome to OMV's 2018 Sustainability Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +27,What is the company name?,BASF Report 2015,BASF SE,2015_BASF_Report.pdf,[1],0.0,2015,BASF,TEXT,"[""BASF Report 2015""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +28,What is the company name?,BASF Report 2016,BASF SE,BASF_Report_2016.pdf,[1],0.0,2016,BASF,TEXT,"[""BASF Report 2016""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +29,What is the company name?,BASF Report 2017,BASF SE,BASF_Report_2017.pdf,[1],0.0,2017,BASF,TEXT,"[""BASF Report 2017""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +30,What is the company name?,BASF Report 2018,BASF SE,BASF_Report_2018.pdf,[1],0.0,2018,BASF,TEXT,"[""BASF Report 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +31,What is the company name?,BOARD OF DIRECTORS AND statutory AUDITORS OF SAIPEM SpA,Saipem SpA,Annual-report-2019.pdf,[2],0.0,2019,SAIPEM SpA,TEXT,"[""BOARD OF DIRECTORS AND statutory AUDITORS OF SAIPEM SpA""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +32,What is the company name?,BP Annual Report and Form 20-F 2018,BP,bp-annual-report-and-form-20f-2018.pdf,[1],0.0,2018,BP,TEXT,"[""BP Annual Report and Form 20-F 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +33,What is the company name?,BP Annual Report and Form 20-F 2019,BP,bp-annual-report-and-form-20f-2019.pdf,[1],0.0,2019,BP,TEXT,"[""BP Annual Report and Form 20-F 2019""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +34,What is the company name?,BP Sustainability Report 2017,BP,bp-sustainability-report-2017.pdf,[1],0.0,2017,BP,TEXT,"[""BP Sustainability Report 2017""]",20201030 1Qbit 
aggregated_annotations_needs_correction.xlsx,1 +35,What is the company name?,BP Sustainability Report 2018,BP,bp-sustainability-report-2018.pdf,[1],0.0,2018,BP,TEXT,"[""BP Sustainability Report 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +36,What is the company name?,BP Sustainability Report 2019,BP,bp-sustainability-report-2019.pdf,[1],0.0,2019,BP,TEXT,"[""BP Sustainability Report 2019""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +37,What is the company name?,Board of Directors and auditors of Saipem SpA,Saipem SpA,ANNUAL REPORT 2017.pdf,[2],0.0,2017,Saipem SpA,TEXT,"[""Board of Directors and auditors of Saipem SpA""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +38,What is the company name?,"Board of Directors’ Safety, Sustainability and Ethics committee.",ENDESA,Endesa SA Annual Report 2018.pdf,[3],0.0,2018,ENDESA,TEXT,"[""ENDESA, S.A. Financial Statements for the year ended 31 December 2018 5 ENDESA, S.A. and Subsidiaries Consolidated Financial Statements for the year ended 31 December 2018 207""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +39,What is the company name?,"Brazil As a major offshore operator, it is particularly relevant for Equinor to keep close engagement with fisheries. Fishermen operating offshore Brazil are impacted by our offshore activities through the regulatory prohibition on fishing near offshore installations. During 2019, Equinor and partners were responsible for training approximately 300 local fishermen to act as response teams in the event of an oil spill at sea, with the purpose of ensuring the safety and protection of marine and coastal environments. The process has resulted in formal certifications for the fishermen and their vessels, creating positive safety results and expanded livelihood opportunities for the fishing communities. 
",OMV,Sustainability Report 2013_EN.pdf,[101],0.0,2013,OMV Aktiengesellschaft,TEXT,"[""Owner and publisher OMV Aktiengesellschaft Trabrennstraße 6-8 1020 Vienna, Austria info.sustainability@omv.com""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +40,What is the company name?,Brazil Biodiversity aspects are a focus area for our operations in Brazil and improvement initiatives have been undertaken in collaboration with the local chapter of the World Business ,Total SA,NYSE_TOT_2015 annual.pdf,[1],0.0,2015,Total,TEXT,"[""TOTAL +COMMITTED TO BETTER ENERGY""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +41,What is the company name?,"Brazil Equinor’s social investment and sponsorship portfolio in Brazil has been reviewed based on four main objectives: (i) build long-term capability for the market through education; (ii) create opportunities for local communities, contributing to a reduction in social inequality; (iii) engage the entire Equinor Brazil organisation and build internal pride, (iv) improve brand recognition and enhance Equinor’s reputation in the local market. ",Equinor,sustainability-report-2019.pdf,[2],0.0,2019,Equinor,TEXT,"[""Equinor supports the Paris agreement and a net zero target +for society. We have already brought COâ‚‚ emissions in the oil +and gas production process down to industry leading levels, +and we will continue to do more. Our journey to develop as a +broad energy company is founded on a strong commitment to +sustainability, and our strategy - always safe, high value and +low carbon - is applied in everything we do.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +42,What is the company name?,"Business context and our approach Equinor is a global company with a presence in parts of the world where corruption represents a high risk. 
With a strategy to accelerate internationalisation and increase investments in new energy markets, 2019 represented a year of continued focus on ethics and anti-corruption. ",Wintershall Dea,Wintershall Dea annual report 2019.pdf,[1],0.0,2019,Wintershall Dea,TEXT,"[""wintershall dea""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +43,What is the company name?,"Business context and our approach Responsible management of our environmental impact is of great importance to Equinor. As a large offshore oil and gas operator and a growing offshore wind power provider, we have identified responsible management of the oceans as a sustainability priority area. ",Koninklijke Vopak NV,vopak_annual_report_2019.pdf,[2],0.0,2019,Vopak,TEXT,"[Vopak | Annual Report 2019 ""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +44,What is the company name?,CABOT OIL & GAS CORPORATION,Cabot Oil & Gas Corp,Cabot Oil & Gas Corp Annual Report 2016.pdf,[1],0.0,2016,CABOT OIL & GAS CORPORATION,TEXT,"[""CABOT OIL & GAS CORPORATION""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +45,What is the company name?,CABOT OIL & GAS CORPORATION 2017 Annual Report,Cabot Oil & Gas Corp,Cabot Oil & Gas Corp Annual Report 2017.pdf,[1],0.0,2017,CABOT OIL & GAS CORPORATION,TEXT,"[""CABOT OIL & GAS CORPORATION +2017 Annual Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +46,What is the company name?,"CCUS As a leader in CCUS, Equinor is working to build a European value chain, capturing and storing CO₂ from industrial plants that have CO₂ as a by-product, for example waste management facilities and cement producers. 
The Norwegian government is a key partner and has also set the ambition to develop a full-scale CCUS value chain in Norway by 2024.",Adani,Adani Group Adani Power Sustainability Report 2018.pdf,[1],0.0,2018-19,Adani Power Limited,TEXT,"[""Adani Power Limited""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +47,What is the company name?,"CIMAREX ENERGY CO. (NYSE: XEC) is an oil and gas exploration and production company with operations mainly located in Oklahoma, Texas and New Mexico. W",Cimarex Energy Co.,Cimarex Annual Report 2019.pdf,[2],0.0,2019,Cimarex Energy Co.,TEXT,"[""CIMAREX ENERGY CO. (NYSE: XEC) is an oil +and gas exploration and production company +with operations mainly located in Oklahoma, +Texas and New Mexico. W""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +48,What is the company name?,"CO₂ released to the atmosphere as a result of our processes and activities, including CO₂ emissions from energy generation, heat production, flaring (including well testing/well work-over), and remaining emissions from carbon capture and treatment plants. Separate data compiled for Equinor operated activities and equity basis.",NOVATEK,AR_FS_2017_ENG.pdf,[1],0.0,2017,PAO NOVATEK,TEXT,"[""PAO NOVATEK ANNUAL REPORT 2017""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +49,What is the company name?,Cabot Oil & Gas Corporation 2019 Annual Report,Cabot Oil & Gas Corp,Cabot Oil & Gas Corp Annual Report 2019.pdf,[9],0.0,2019,Cabot Oil & Gas Corporation,TEXT,"[""Cabot Oil & Gas Corporation +2019 Annual Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +50,What is the company name?,"Cabot Oil & Gas Corporation, headquartered in Houston, Texas, is an independent oil and gas producer. 
The Company's focused operations are centered around developing its natural gas resources in northeast Pennsylvania.",Cabot Oil & Gas Corp,Cabot Oil & Gas Corp Annual Report 2018.pdf,[3],0.0,2018,Cabot Oil & Gas Corporation,TEXT,"[""Cabot Oil & Gas Corporation, headquartered in Houston, Texas, is an independent oil and gas producer. The Company's focused operations are centered around developing its natural gas resources in northeast Pennsylvania.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +51,What is the company name?,"Callon Petroleum is an independent oil and natural gas company focused on the acquisition, exploration and development of high-quality assets in the heart of the Permian Basin. Our mission is to build trust, create value, and drive sustainable growth for our investors, our employees and the communities in which we operate.",Callon Petroleum Co,Callon Petroleum Co Annual Report 2017.pdf,[2],0.0,2017,Callon Petroleum,TEXT,"[""Callon Petroleum is an independent oil and natural gas company focused on the acquisition, +exploration and development of high-quality assets in the heart of the Permian Basin. +Our mission is to build trust, create value, and drive sustainable growth for our investors, +our employees and the communities in which we operate.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +52,What is the company name?,"Callon Petroleum is an independent oil and natural gas company focused on the acquisition, exploration, and development of high-quality assets in the leading oil plays of the Permian Basin in West Texas and Eagle Ford Shale in South Texas. 
Our mission is to build trust, create value, and drive sustainable growth for our investors, our employees, and the communities in which we operate.",Callon Petroleum Co,Callon Petroleum Co Annual Report 2019.pdf,[2],0.0,2019,Callon Petroleum,TEXT,"[""Callon Petroleum is an independent oil and natural gas company focused +on the acquisition, exploration, and development of high-quality assets +in the leading oil plays of the Permian Basin in West Texas and Eagle Ford +Shale in South Texas. Our mission is to build trust, create value, and drive +sustainable growth for our investors, our employees, and the communities +in which we operate.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +53,What is the company name?,Canadian Natural 2018 Annual Report Premium Value. Defined Growth. Independent.,Canadian Natural Resources Ltd,Canadian Natural Resources Annual Report 2018.pdf,[2],0.0,2018,Canadian Natural,TEXT,"[""Canadian Natural 2018 Annual Report Premium Value. Defined Growth. Independent.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +54,What is the company name?,Canadian Natural 2019 Annual Report 30 Years of Premium Value.,Canadian Natural Resources Ltd,Canadian Natural Resources Annual Report 2019.pdf,[2],0.0,2019,Canadian Natural,TEXT,"[""Canadian Natural 2019 Annual Report 30 Years of Premium Value.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +55,What is the company name?,"Canadian Natural demonstrated strong operational and financial performance throughout 2017 and completed its transition to a long life low decline asset base. 
The Company's focus on disciplined and balanced capital allocation continues, generating sustainable free cash flow for years to come.",Canadian Natural Resources Ltd,Canadian Natural Resources Annual Report 2017.pdf,[2],0.0,2017,Canadian Natural,TEXT,"[""Canadian Natural demonstrated strong operational and financial performance throughout 2017 and completed its transition to a long life low +decline asset base. The Company's focus on disciplined and balanced capital allocation continues, generating sustainable free cash flow for +years to come.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +56,What is the company name?,"Carbon costs and taxes Specific regulations (e.g. air quality, emission standards and fuel directives)",Cimarex Energy Co.,Cimarex Annual Report 2019.pdf,[2],0.0,2019,Cimarex Energy Co.,TEXT,"[""CIMAREX ENERGY CO. (NYSE: XEC) is an oil +and gas exploration and production company +with operations mainly located in Oklahoma, +Texas and New Mexico. W""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +57,What is the company name?,CenterPoint Energy,CenterPoint Energy,CenterPoint Energy Annual report 2019.pdf,[1],0.0,2019,CenterPoint Energy,TEXT,"[""CenterPoint Energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +58,What is the company name?,CenterPoint Energy 2016 Annual Report,CenterPoint Energy,CenterPoint Energy Annual report 2016.pdf,[1],0.0,2016,CenterPoint Energy,TEXT,"[""CenterPoint Energy 2016 Annual Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +59,What is the company name?,CenterPoint Energy 2016 Corporate Responsibility Report,CenterPoint Energy,CenterPoint Energy Corporate Responsibility report 2016.pdf,[1],0.0,2016,CenterPoint Energy,TEXT,"[""CenterPoint Energy 2016 Corporate Responsibility Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +60,What is the company name?,Cheniere 2019 corporate responsibility report,Cheniere 
Energy,Cheniere Energy Corporate Responsibility Report 2019.pdf,[1],0.0,2019,Cheniere ,TEXT,"[""Cheniere 2019 corporate responsibility report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +61,What is the company name?,"Cheniere energy, inc.",Cheniere Energy,Cheniere Energy Annual report 2019.pdf,[1],0.0,2019,Cheniere Energy,TEXT,"[""Cheniere energy, inc.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +62,What is the company name?,"Cheniere energy, inc. 2017 annual report",Cheniere Energy,Cheniere Energy Annual report 2017.pdf,[1],0.0,2017,Cheniere ,TEXT,"[""Cheniere energy, inc. 2017 annual report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +63,What is the company name?,"Cheniere energy, inc. 2018 annual report",Cheniere Energy,Cheniere Energy Annual report 2018.pdf,[1],0.0,2018,Cheniere Energy,TEXT,"[""Cheniere energy, inc. 2018 annual report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +64,What is the company name?,Chesapeake energy,Chesapeake energy,Chesapeake 2018 Annual Report.pdf,[1],0.0,2018,Chesapeake energy,TEXT,"[""Chesapeake energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +65,What is the company name?,"Chronical effects (e.g. sea water rise, increased scarcity of water) Acute effects (e.g. more frequent and more extreme weather events)",Surgutneftegas,GO SNG 2018 Eng annual.pdf,[2],0.0,2018,Surgutneftegas,TEXT,"[""At the moment, ""Surgutneftegas"" PJSC +develops six fields in Eastern Siberia, +the volume of production continues +to increase: in 2018, oil production +was 9.1 million tonnes, making 15% +of the Company's total oil production. +In 2019, the Company expects to put on +stream one more field in the Republic +of Sakha (Yakutia) - the Lenskoye field, +where we are actively engaged in building +the infrastructure. 
In the next 3-4 years, +oil production at this field is expected to +reach 1.5-2 million tonnes per year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +66,What is the company name?,"Code of Conduct - The Code of Conduct sets out our commitment and requirements for how we work at Equinor. It applies to employees, Equinor board members and hired contractors. We train our employees on how to apply the Code of Conduct in their work. All Equinor employees are required to confirm annually that they understand and will comply with the Code of Conduct. We expect our suppliers to act in a way that is consistent with our Code of Conduct. We engage with our suppliers to help them understand our ethical requirements and how we do business. If the expectations are not met, we take appropriate actions.","Aktsionernoe Obshchestvo Rosneftegaz, Moscow",RN_SR2018_eng_web_1 sustainability 2017.pdf,[1],0.0,2017,Rosneft,TEXT,"[""ROSNEFT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +67,What is the company name?,"Competence development and awareness for all staff is important to strengthen security culture. Our security month in 2019 had the theme See Something, Say Something which was designed to simplify the incident reporting process. An increasing international presence places renewed importance on travel security. We developed specific country requirements for travelers and made them more easily accessible through company Apps and online platforms. ",AES Corporation ,AES Corporation 2018_SustainabilityReport_vFinal.pdf,[4],0.0,2018,The AES Corporation,TEXT,"[""The AES Corporation (NYSE: AES) is a Fortune 200 global power company founded in 1981. The company's headquarters are in Arlington, Virginia, United States (US). 
AES is publicly traded company, incorporated in Delaware and governed by a Board of Directors.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +68,What is the company name?,"Consistent with our values and to strengthen our brand and attractiveness as an employer, we successfully implemented a global parental leave policy in all Equinor companies and health insurance in Equinor ASA effective from January 2019. A minimum of 16 weeks paid leave is offered to all employees in the group becoming parents through birth or adoption. The health insurance scheme, supplementing public health services, offers access to private specialists, medical examinations and treatments, and is similar to local health insurance already provided in our subsidiaries. We expect the scheme to have a positive effect on employees’ health and believe that both benefits ",Ameren Corporation,Ameren Corporation Sustainability Template 2019.pdf,[1],0.0,2019,Ameren,TEXT,"[""Ameren""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +69,What is the company name?,"Corporate Name: ENDESA, S.A.",ENDESA,Endesa SA Annual Report 2017.pdf,[1],0.0,2017,ENDESA,TEXT,"[""Corporate Name: ENDESA, S.A.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +70,What is the company name?,Countries in which supplier HR verifications undertaken,CenterPoint Energy,CenterPoint Energy Corporate Responsibility report 2017.pdf,[1],0.0,2017,CenterPoint Energy,TEXT,"[""CenterPoint Energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +71,What is the company name?,"Creating shared value with communities Equinor’s transition to a global energy company requires systematic development of competence and access to new talent. We empower our people to execute on business ambitions, while promoting personal growth and development. Through learning and development activities we prepare for increased digitalisation and new ways of working. 
As part of our long-term commitment to creating shared value, Equinor emphasises building skills and capacity in the communities where we have activities. A large portion of our sponsorships, donations and social investments is allocated to capacity building within science, technology, engineering and mathematics (STEM), through partnerships with academic institutions and support to science centres. Our academia collaboration with key universities increasingly addresses the energy transition and new energy solutions. Through our Heroes of Tomorrow programme, we give children and youth the opportunity to develop their talents within the areas of sports, culture and education. In 2019, our corporate sponsorships spend was USD 19.2 million.",Callon Petroleum Co,Callon Petroleum Co Annual Report 2019.pdf,[2],0.0,2019,Callon Petroleum,TEXT,"[""Callon Petroleum is an independent oil and natural gas company focused +on the acquisition, exploration, and development of high-quality assets +in the leading oil plays of the Permian Basin in West Texas and Eagle Ford +Shale in South Texas. 
Our mission is to build trust, create value, and drive +sustainable growth for our investors, our employees, and the communities +in which we operate.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +72,What is the company name?,"Creating shared value: Economic and social impact, Local procurement, Employment, People development, Innovation and research and development activities",CenterPoint Energy,CenterPoint Energy Annual report 2018.pdf,[1],0.0,2018,CenterPoint Energy,TEXT,"[""CenterPoint Energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +73,What is the company name?,"DCP MIDSTREAM, LP (Exact name of registrant as specified in its charter)",DCP Midstream,2019 DCP Midstream annual report.pdf,[1],0.0,2019,DCP Midstream,TEXT,"[""DCP MIDSTREAM, LP (Exact name of registrant as specified in its charter)""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +74,What is the company name?,Develop people and promote diversity and inclusion,NRG,nrg-sustainability-report_2017.pdf,[14],0.0,2017,NRG Energy,TEXT,"[""This sustainability report is based on NRG corporate performance for all operations in calendar year 2017 and, where stated, ""NRG"" refers to NRG Energy, Inc., as well as its affiliates that include assets owned by NRG Energy, Inc. and NRG Yield, Inc.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +75,What is the company name?,"Developing our people As Equinor develops into a broad energy company and accelerates the use of digital solutions, our ability to drive people development is critical to the delivery of our business strategy. Building a culture of lifelong learning where our employees develop new skills faster to match changing job requirements, has been a key focus area in 2019. We continue to use deployment across the company as a strong tool for driving on-the-job learning. 
Through all the academies in The Equinor University we intensified our formal learning activities, particularly relating to safety and digitalisation. In 2019, we more than tripled our learning activities in digital topics, including the introduction of ‘Digital Leadership’ training for our leaders. In addition, we significantly increased learning activities across the company, using e-learning and virtual classrooms as a flexible, accessible and cost-effective means to increase participation. ",Southern Company,Southern Company_2018_Corporate_Responsibility_Report.pdf,[1],0.0,2018,Southern Company,TEXT,"[""Southern Company is transitioning our energy generation fleet for a low-carbon future. In doing so, we have established an intermediate goal of a 50 percent reduction in carbon emissions from 2007 levels by 2030 and a long-term goal of low- to no-carbon operations by 2050.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +76,What is the company name?,"Devon Energy is proud to present our 2019 Sustainability Report, highlighting our efforts to deliver industry-leading results, while setting the standard as a good neighbor, valued community partner, caring environmental steward and model employer.",Devon Energy,DVN_SR19_0_FULL-REPORT_060820.pdf,[3],0.0,2019,Devon Energy,TEXT,"[""Devon Energy is proud to present our 2019 Sustainability Report, highlighting our efforts to deliver industry-leading results, while setting the standard as a good neighbor, valued community partner, caring environmental steward and model employer.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +77,What is the company name?,"Devon is a leading independent energy company engaged primarily in the exploration, development and production of oil, natural gas and NGLs. Our operations are concentrated in various North American onshore areas in the U.S. and Canada. 
Our portfolio of oil and gas properties provides stable, environmentally responsible production and a platform for future growth. We have doubled our onshore North American oil production since 2010 to more than 275 MBbls per day and have a deep inventory of development opportunities. Devon also produces over 1.6 Bcf of natural gas a day and more than 136 MBbls of NGLs per day.",Devon,NYSE_DVN_2015.pdf,[8],0.0,2015,Devon,TEXT,"[""Devon is a leading independent energy company engaged primarily in the exploration, development and +production of oil, natural gas and NGLs. Our operations are concentrated in various North American onshore +areas in the U.S. and Canada. Our portfolio of oil and gas properties provides stable, environmentally responsible +production and a platform for future growth. We have doubled our onshore North American oil production since +2010 to more than 275 MBbls per day and have a deep inventory of development opportunities. Devon also +produces over 1.6 Bcf of natural gas a day and more than 136 MBbls of NGLs per day.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +78,What is the company name?,"Digitalisation Equinor’s digital roadmap is progressing well. New digital technologies are implemented to help us reach our goals of improved safety performance, reduced emissions and higher value. The integrated operations support centre, established in 2018, will be central in reducing CO₂ emissions from the NCS. Equinor has so far connected 20 of its assets to this centre, streaming data to our cloud-based data platform. By end of 2020 all operated fields on the NCS will be connected. Cross-functional teams utilise this data to discover opportunities for energy efficiency measures, safety and value improvements. Another centre, the geo-operations centre, ensures more efficient and better geoscience control of drilling operations, as well as cost savings and improved personnel safety. 
Further, subsurface data are connected and analysed in new ways through our subsurface data lake, enhancing the reservoir performance. Our digital field worker concept is also being broadly implemented, allowing our operators and engineers easy access to data enabling improved safety performance, higher efficiency and reduced carbon footprint. Workforce diversity and inclusion Embracing diversity and driving inclusion is a fundamental part of our values - open, collaborative, courageous and caring - and an integral part of our leadership expectations. This includes working actively to ensure that everyone has equal opportunities at Equinor. In 2019, we continued to strengthen diversity and inclusion in Equinor by embedding it into our key human resources processes, such as recruitment, succession planning, performance management and leadership development. We monitor diversity in our workforce at all levels and locations and encourage and support employee initiatives that contribute to a diverse and inclusive culture. In 2019, we established guidelines to further support employee resource groups in Equinor, including Women in Equinor, Differently Abled and LGBTQ+ groups. ",CenterPoint Energy,CenterPoint Energy Annual report 2019.pdf,[1],0.0,2019,CenterPoint Energy,TEXT,"[""CenterPoint Energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +79,What is the company name?,Direct GHG emissions from operations that are owned and/or controlled by the organisation. ,LOTOS Group,2_LOTOS_Group Directors Report 2019.pdf,[5],0.0,2019,LOTOS ,TEXT,"[""Grupa LOTOS S.A. is the second largest fuel producer in Poland. The Company's refinery in GdaÅ„sk is among the newest, the most advanced and most environmentally-friendly plants of this type in Europe. 
In 2019, the refinery operated at full capacity, having processed 10.7m tonnes of crude oil.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +80,What is the company name?,"Drilling operations create large quantities of rock cuttings contaminated with drilling mud and fluids from the rock formations. These rock cuttings are in many offshore cases grinded into a slurry and injected into subsurface formations for permanent storage. In other cases, rock cuttings are collected and transported to shore for cleaning and disposal or, in cases where water-based mud is used, discharged to sea. In many cases where oil-based drilling mud is used, transport of drill cuttings to shore for treatment and disposal is needed, requiring comprehensive logistical solutions and waste handling onshore. Thermomechanical cuttings cleaning (TCC), in which oil is removed from the drill cuttings through mechanical friction and heating, offers improved treatment of drill cuttings offshore and makes discharge of such cutting ",Teekay Corp,2017-Sustainability-Report.pdf,[1],0.0,2017,TEEKAY CORPORATION,TEXT,"[""TEEKAY CORPORATION 2017 Sustainability Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +81,What is the company name?,"During 2019 Equinor undertook a comprehensive review of its memberships in industry associations that have a position on climate and energy policy. Equinor holds membership and is engaged in more than 100 energy and climate associations and initiatives globally, of which approximately 25% are non- advocacy. We have inquired the associations with an active policy agenda to determine whether their respective climate stance is in alignment with Equinor's. After a screening of more than 80 associations within scope, some of the associations have been subject to a deeper assessment where they were contacted in written and feedback was received. 
",EVN,Vietnam Electricity Corporation (EVN)_AnnualReport2018(1).pdf,[46],0.0,2018,Vietnam Electricity,TEXT,"[""VIETNAM ELECTRICITY 11 Cua Bac street, Ba Dinh district, Hanoi, Vietnam Website: http://www.evn.com.vn Telephone: 024.66946789 | Fax: 024.66946666""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +82,What is the company name?,"During 2019, we continued our efforts towards awareness and training on human rights across the company. The senior leadership team continued to develop their approach to human rights throughout 2019, discussing the topic for more than six hours in the corporate executive committee meetings. In addition, our human rights efforts were discussed and evaluated in two meetings by the Board of Directors Safety, Sustainability and Ethics Committee and once with the full Board of Directors. Every business area management committee and most functional management teams have conducted targeted awareness sessions at least once. ",RWE,RWE-csr_overall-report-2019.pdf,[26],0.0,2019,RWE AG,TEXT,"[""RWE AG is meeting the obligation to publish a Non-financial Report envisaged pursuant to the German Commercial Code (HGB) in a separate section of this CR report.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +83,What is the company name?,EDF group is the world's leading electricity company and global leader for low-carbon energy production.,EDF,EDF-ddr-2017-accessible-version-en.pdf,[5],0.0,2017,EDF Group,TEXT,"[""EDF group is the world's leading electricity company and global leader for low-carbon energy production.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +84,What is the company name?,ELEKTRİK RETİM A.Ş. ELECTRICITY GENERATION CO.,Elektrik Üretim A.Ş.,Elektrik Üretim A.Ş. Genel Müdürlüğü (EÜAŞ) Annual Report 2018.pdf,[1],0.0,2018,ELEKTRİK ÜRETİM A.Ş.,TEXT,"[""ELEKTRİK ÜRETİM A.Ş. 
ELECTRICITY GENERATION CO.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +85,What is the company name?,"ENDESA, S.A. Financial Statements for the year ended 31 December 2018 5 ENDESA, S.A. and Subsidiaries Consolidated Financial Statements for the year ended 31 December 2018 207",ENDESA,Endesa SA Annual Report 2018.pdf,[3],0.0,2018,ENDESA,TEXT,"[""ENDESA, S.A. Financial Statements for the year ended 31 December 2018 5 ENDESA, S.A. and Subsidiaries Consolidated Financial Statements for the year ended 31 December 2018 207""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +86,What is the company name?,ENI IN THE WORLD,Eni SpA,EniFor-2018-eng.pdf,[6],0.0,2018,Eni,TEXT,"[""ENI IN THE WORLD""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +87,What is the company name?,"Early Talents We continue to invest in our early talents through our graduate and apprentice programmes. In 2019, we welcomed 182 graduates and 157 apprentices. Through our recruitment and attraction activities we strive to increase the diversity of our early talent applicant base and hires, and our ambition was to achieve a 50-50 balance on gender and non-Norwegian background in 2019. In 2019, we made strides towards achieving this goal with a 43-57 split between female and male graduates recruited, and a 45-55 split between graduates recruited with a non- Norwegian and Norwegian background.",Adani,Adani Group Adani Power Annual Report 2019.pdf,[1],0.0,2018-19,Adani Power Limited,TEXT,"[""Adani Power Limited""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +88,What is the company name?,"Employee relations We believe in involving our people in the development of the company. In all countries where we are present, we involve our employees and/or their appropriate representatives according to local laws and practices. 
This varies from formal bodies with employee representatives to employee engagement and involvement through team or town hall meetings. ",CenterPoint Energy,CenterPoint Energy Annual report 2017.pdf,[1],0.0,2017,CenterPoint Energy,TEXT,"[""CenterPoint Energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +89,What is the company name?,Eni Annual Report 2018,Eni SpA,Annual-Report-2018.pdf,[5],0.0,2018,Eni,TEXT,"[""Eni Annual Report 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +90,What is the company name?,"Environment of Norway. Its task is to promote a shift towards more environmentally friendly energy consumption and production, as well as the development of energy and climate technology.",Enel,Enel annual-report-2018.pdf,[9],0.0,2018,Enel Group,TEXT,"[""The Enel Group structure is organized into a matrix that comprises: +>>Business Lines (Global Thermal Generation, Global Trading, Global Infrastructure and Networks, Enel Green Power, Enel X), which are responsible for managing and developing assets, optimizing their performance and the return on capital employed in the various geographical areas in which the Group operates. The Business Lines are also responsible for improving the efficiency of the processes they manage and sharing best practices at the global level. The Group will benefit from a centralized industrial vision of projects in the various Business Lines. 
Each project will be assessed not only on the basis of its financial return but also in relation to the best technologies available at the Group level, +>>Regions and Countries (Italy, Iberia, South America, Europe and Euro-Mediterranean Affairs, North and Central America, Africa, Asia and Oceania), which are responsible for managing relationships with institutional bodies and regulatory authorities, as well as selling electricity and gas, in each of the countries in which the Group operates, while also providing staff and other service support to the Business Lines.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +91,What is the company name?,Equinor Brazil has approved a new social investment initiative which is inspired and guided by the UN’s ,OMV,dload_Sustainability Report 2018_en.pdf,[2],0.0,2018,OMV Group,TEXT,"[""This report covers the operations of the OMV Group, headquartered in Vienna, Austria, for the 2018 business year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +92,What is the company name?,Equinor Sustainability report 2019 Always safe - Responsible operationsEquinor Sustainability report 2019 Always safe - Responsible operations,BASF SE,BASF_Report_2018.pdf,[1],0.0,2018,BASF,TEXT,"[""BASF Report 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +93,What is the company name?,Equinor Sustainability report 2019 Always safe - Responsible operationsEquinor Sustainability report 2019 Always safe - Responsible operations0.511.522.533.5201520162017201820190Sulphur Oxides (SOx)(thousand tonnes)2.51.81.71.82.2Regular discharges of oil to water(thousand tonnes)00.20.40.60.811.21.41.6201520162017201820191.41.41.21.11.2,EDF,EDF-ddr-2018-en.pdf,[3],0.0,2018,EDF Group,TEXT,"[""A key player in the energy transition, EDF group is an integrated energy company, active in all areas of the business: generation, transmission, distribution, trading, energy supply and energy services. 
As a global leader in low-carbon energy, the Group has developed a diversified generation mix based on nuclear power, thermal energy, hydropower and other renewable energies.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +94,What is the company name?,Equinor Sustainability report 2019 Equinor. Sustainability report 2019 ,Ameren Corporation,Ameren_2019_Annual_Report.pdf,[1],0.0,2019,Ameren,TEXT,"[""Ameren""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +95,What is the company name?,Equinor Sustainability report 2019 High value — creating shared value,Tatneft,PJSC Tatneft annual report 2015.pdf,[3],0.0,2015,TATNEFT,TEXT,"[""TATNEFT Company successfully accomplished all of the planned programs in 2015. In the difficult macroeconomic +environment the Company implemented a set of production and economic compensatory measures to maintain +the Company's status in the group of the leaders of the Russian fuel and energy complex.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +96,What is the company name?,"Equinor Sustainability report 2019Always safe - Responsible operationsEquinor Sustainability report 2019 Always safe - Responsible operations(million hours)Total serious incident frequencyTarget 2019Hours worked0.60.80.60.50.60.401002003004000123420152016201720182019(million hours)Total recordable injury frequencyTarget 2019Working hours2.72.7125.3128128.9123.71472.82.82.5(cubic metres)1,8003,6005,4007,2009,000(number per year)6012018024030020152016201720182019Number of spillsVolume of oil spills172146207238219316134138898321010203020152016201720182019Target 201918151210Oil and gas leakages",Diamondback Energy,Diamondback 2019 Corporate Responsibility_2.pdf,[2],0.0,2018,Diamondback Energy,TEXT,"[""This is the second annual corporate responsibility report for Diamondback Energy, Inc. (""Diamondback""). 
+Except where otherwise noted, the scope of this report comprises all operations (excluding Viper Energy +Partners) and includes data through December 31, 2018.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +97,What is the company name?,Equinor Sustainability report 2019AppendicesEquinor Sustainability report 2019 Appendices,AGL Energy Ltd,AGL Energy Ltd Annual Report 2019.pdf,[1],0.0,2019,AGL,TEXT,"[""agl""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +98,What is the company name?,Equinor Sustainability report 2019High value — creating shared valueEquinor Sustainability report 2019 High value — creating shared value,NOVATEK,AR_FS_2017_ENG.pdf,[4],0.0,2017,NOVATEK,TEXT,"[""About the Company NOVATEK is one of the largest independent natural gas producers in Russia""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +99,What is the company name?,Equinor Sustainability report 2019Low carbon — Creating a low carbon advantage,Aker BP,Aker-BP-Sustainability-Report-2018-1.pdf,[1],0.0,2018,Aker BP,TEXT,"[""Aker BP""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +100,What is the company name?,Equinor Sustainability report 2019Low carbon — Creating a low carbon advantageEquinor Sustainability report 2019Low carbon — Creating a low carbon advantage,BASF SE,BASF_Report_2017.pdf,[1],0.0,2017,BASF,TEXT,"[""BASF Report 2017""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +101,What is the company name?,Equinor Sustainability report 2019Sustainability at EquinorEquinor Sustainability report 2019 Sustainability at Equinor,OMV,Sustainability Report 2017_EN.pdf,[67],0.0,2017,OMV Aktiengesellschaft,TEXT,"[""OMV Aktiengesellschaft Trabrennstrasse 6 - 8 1020 Vienna, Austria Tel. 
+43 1 40440-0 info@omv.com www.omv.com""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +102,What is the company name?,"Equinor and partners plan to maximise the utilisation of power from shore for the Utsira High area. In the second phase of the Johan Sverdrup field development, a power hub will be installed, allowing for the Gina Krog, Ivar Aasen and Edvard Grieg fields, as well as Johan Sverdrup second phase, to be powered from the onshore grid. In October 2019, Equinor announced that the area’s license partners are working towards a partial electrification of the Sleipner field, together with the Gudrun platform and other tie-ins. In total ten fields will receive power through the Utsira High area solution, contributing to an average reduction of 1.2 million tonnes of CO₂ per year. ",Devon Energy,DVN_SR19_0_FULL-REPORT_060820.pdf,[3],0.0,2019,Devon Energy,TEXT,"[""Devon Energy is proud to present our 2019 Sustainability Report, highlighting our efforts to deliver industry-leading results, while setting the standard as a good neighbor, valued community partner, caring environmental steward and model employer.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +103,What is the company name?,"Equinor is currently introducing a new operational planning tool aimed at improving operational safety and risk management at onshore and offshore installations during operations and maintenance. It is designed to strengthen compliance with work processes for safe work, including work permits, safe job analysis, isolation plans and operational risk assessments. Live overview of planned and ongoing activities is displayed along with factors affecting risk exposure such as leaks and seeps, dispensations and other operational conditions. Gathering all safe work information in one system provides a better overview of the total risk picture of the installation and thereby enables improved risk management. 
",Devon,NYSE_DVN_2015.pdf,[8],0.0,2015,Devon,TEXT,"[""Devon is a leading independent energy company engaged primarily in the exploration, development and +production of oil, natural gas and NGLs. Our operations are concentrated in various North American onshore +areas in the U.S. and Canada. Our portfolio of oil and gas properties provides stable, environmentally responsible +production and a platform for future growth. We have doubled our onshore North American oil production since +2010 to more than 275 MBbls per day and have a deep inventory of development opportunities. Devon also +produces over 1.6 Bcf of natural gas a day and more than 136 MBbls of NGLs per day.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +104,What is the company name?,"Equinor owns and operates the South Riding Point (SRP) terminal for storage and transshipment of oil, located on Grand Bahama Island. In September 2019, the country was impacted by Hurricane Dorian, resulting in the worst natural disaster in its history. In advance of the impact, Equinor shut down SRP operations and took measures to secure personnel and the facility. In line with normal procedure, our emergency preparedness organisation was also engaged. At the time the hurricane arrived, we had 54 personnel on Grand Bahama. All were confirmed safe and accounted for. However, the terminal sustained damage and an oil spill was confirmed at a volume of 55,000 barrels out of 1,870 million barrels stored. Most of the spilled volumes ",OMV,Sustainability Report 2012_EN.pdf,[2],0.0,2012,OMV,TEXT,"[""OMV Sustainability Report 2012 The OMV Sustainability Report covers the 2012 business year and describes our sustainability performance and relevant data""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +105,What is the company name?,"Equinor supports the Paris agreement and a net zero target for society. 
We have already brought CO‚‚ emissions in the oil and gas production process down to industry leading levels, and we will continue to do more. Our journey to develop as a broad energy company is founded on a strong commitment to sustainability, and our strategy - always safe, high value and low carbon - is applied in everything we do.",Equinor,sustainability-report-2019.pdf,[2],0.0,2019,Equinor,TEXT,"[""Equinor supports the Paris agreement and a net zero target +for society. We have already brought COâ‚‚ emissions in the oil +and gas production process down to industry leading levels, +and we will continue to do more. Our journey to develop as a +broad energy company is founded on a strong commitment to +sustainability, and our strategy - always safe, high value and +low carbon - is applied in everything we do.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +106,What is the company name?,"Equinors’ strategy defines ‘’Always safe’’ as one of its three main elements and our ambition is to be a leader in safety and security in our industry. Based on a review of best practices in previous years, areas for improvement have been identified, and in 2019 several initiatives aimed at strengthening the safety culture and consistency across the company were rolled out. ",Aker BP,AKERBP-Annual-Report-2017.pdf,[1],0.0,2017,Aker BP,TEXT,"[""AKER BP ASA""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +107,What is the company name?,"Equinor’s Climate Roadmap sets out new short-, mid- and long-term ambitions to reduce our own greenhouse gas emissions and to shape our portfolio. To achieve these ambitions, we need to strengthen our collaboration with governments, customers, and industry sectors to speed up the pace of the transition and deliver solutions at scale. Therefore, it is also a standing invitation to engage in a dialogue and work with us in shaping a more sustainable energy future. 
","Aktsionernoe Obshchestvo Rosneftegaz, Moscow",annual 2017.pdf,[1],0.0,2017,Rosneft,TEXT,"[""ROSNEFT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +108,What is the company name?,"Equinor’s expectations are that policy measures should: • • be predictable, transparent and internationally aligned, to trigger investments and innovation • phase out subsidies on fossil fuels that exacerbate climate change and undermine the effects of other policy ",ROMGAZ,2017 Sustainability Report.pdf,[3],0.0,2017,Romgaz S.A,TEXT,"[""This is the first sustainability report published by S.N.G.N. Romgaz S.A. The report on the activity of 2017 shows for the first time the non-financial performance and details the material topics identified by the first materiality study performed by the company.']",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +109,What is the company name?,"Equinor’s purpose is to turn natural resources into energy for people and progress for society. Our strategy – always safe, high value and low carbon – positions us to deliver long-term value in a low carbon future. This is reflected in our vision: Shaping the future of energy. We are developing from an oil and gas company to a broader energy company. Our three sustainability priorities – responsible operations, creating a low-carbon business advantage, and creating shared value – are embedded in our strategy. ",PAO OGK-2,PAO OGK-2_AR 2018.pdf,[2],0.0,2018,JSC OGK-2,TEXT,"[""JSC OGK-2""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +110,What is the company name?,Establishment and implementation of company-wide processes focusing on closed loop learning and assurance activities are done to ensure better learning and experience transfer. 
,Ervia,Ervia-Annual-Report-2018.pdf,[4],0.0,2018,Ervia,TEXT,"[""At Ervia we have a pivotal role to play +in enhancing the environment, leading +the transition to a low carbon energy +system, protecting precious water +resources and increasing resilience.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +111,What is the company name?,FEBRUARY 2020 DCP Midstream Sustainability Report,DCP Midstream,DCP Midstream sustainability report 2020.pdf,[1],0.0,2020,DCP Midstream,TEXT,"[""FEBRUARY 2020 DCP Midstream Sustainability Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +112,What is the company name?,Feedback We welcome your feedback. Please use the e-mail and social media channels linked below for comments and questions. ,"Aktsionernoe Obshchestvo Rosneftegaz, Moscow",annual 2016.pdf,[1],0.0,2016,Rosneft,TEXT,"[""ROSNEFT FOR THE BENEFIT OF RUSSIA""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +113,What is the company name?,"Fiscal 2017 was yet another outstanding year for Berry. We celebrated our 50th year in business, we were added to the Fortune 500 list, completed two acquisitions, and delivered strong financial results. Specifically, in fiscal 2017, we delivered revenue of $7.1 billion, operating EBITDA of $1.33 billion and adjusted free cash flow of $601 million, all records for any fiscal year in the Company's history. Additionally, the value of Berry's stock rose over 29% during fiscal year 2017. These extraordinary results reflect the strong fundamental strategies of our expanded global businesses, contributions from our acquisitions, as well as a relentless focus on execution by our dedicated employees.",Berry,2017 Annual Report Proof -01.19.18.pdf,[3],0.0,2017,Berry,TEXT,"[""Fiscal 2017 was yet another outstanding year for Berry. We celebrated our +50th year in business, we were added to the Fortune 500 list, completed +two acquisitions, and delivered strong financial results. 
Specifically, in +fiscal 2017, we delivered revenue of $7.1 billion, operating EBITDA of $1.33 +billion and adjusted free cash flow of $601 million, all records for any fiscal +year in the Company's history. Additionally, the value of Berry's stock rose +over 29% during fiscal year 2017. These extraordinary results reflect the strong fundamental strategies of our +expanded global businesses, contributions from our acquisitions, as well as a relentless focus on execution by +our dedicated employees.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +114,What is the company name?,"Following the agreement of peer collaboration on human rights supplier assessments in 2018, a platform for sharing and viewing of assessments has been developed and will be launched in 2020. This industry-first initiative will drive collaboration in the follow up process towards energy company suppliers. ",Delek US,Delek2016Annual Report 10 K.pdf,[2],0.0,2016,Delek US,TEXT,"[""Founded in 2001, Delek US Holdings, Inc. +(NYSE: DK) is a downstream energy company with +assets in petroleum refining and logistics. Delek +US consists of two business segments: refining +and logistics. Delek US Holdings, Inc. also owns +approximately 47 percent of the outstanding common +stock of Alon USA Energy, Inc. (NYSE: ALJ).""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +115,What is the company name?,"Founded in 2001, Delek US Holdings, Inc. (NYSE: DK) is a downstream energy company with assets in petroleum refining and logistics. Delek US consists of two business segments: refining and logistics. Delek US Holdings, Inc. also owns approximately 47 percent of the outstanding common stock of Alon USA Energy, Inc. (NYSE: ALJ).",Delek US,Delek2016Annual Report 10 K.pdf,[2],0.0,2016,Delek US,TEXT,"[""Founded in 2001, Delek US Holdings, Inc. +(NYSE: DK) is a downstream energy company with +assets in petroleum refining and logistics. 
Delek +US consists of two business segments: refining +and logistics. Delek US Holdings, Inc. also owns +approximately 47 percent of the outstanding common +stock of Alon USA Energy, Inc. (NYSE: ALJ).""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +116,What is the company name?,"Founded in 2001, Delek US Holdings, Inc. (NYSE: DK) is a downstream energy company with assets in petroleum refining, logistics and convenience store retailing.",Delek US,2017Delek AR1 final smaller file size.pdf,[2],0.0,2017,Delek US,TEXT,"[""Founded in 2001, Delek US Holdings, Inc. +(NYSE: DK) is a downstream energy company +with assets in petroleum refining, logistics +and convenience store retailing.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +117,What is the company name?,"From 2020, with the addition of a full year of production from the electrified Johan Sverdrup field, we expect the CO₂ intensity to improve. As such, and due to several identified CO₂ emission reduction measures in Norway, the 2030 CO₂ intensity ambition has been moved forward to 2025. ",Saipem SpA,ANNUAL REPORT 2017.pdf,[2],0.0,2017,Saipem SpA,TEXT,"[""Board of Directors and auditors of Saipem SpA""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +118,What is the company name?,"From a financial, operational and strategic perspective, 2017 was a strong year for Xcel Energy.",XCEL,Xcel_Energy-AR2017.pdf,[3],0.0,2017,Xcel Energy,TEXT,"[""From a financial, operational and strategic perspective, 2017 was a strong year for Xcel Energy.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +119,What is the company name?,GAZPROM GROUPS SUSTAINABILITY REPORT 2018,Gazprom ,sustainability-report-en-2018.pdf,[1],0.0,2018,GAZPROM,TEXT,"[""GAZPROM GROUP´S SUSTAINABILITY REPORT 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +120,What is the company name?,"Grupa LOTOS S.A. is the second largest fuel producer in Poland. 
The Company's refinery in Gda„sk is among the newest, the most advanced and most environmentally-friendly plants of this type in Europe. In 2019, the refinery operated at full capacity, having processed 10.7m tonnes of crude oil.",LOTOS Group,2_LOTOS_Group Directors Report 2019.pdf,[5],0.0,2019,LOTOS ,TEXT,"[""Grupa LOTOS S.A. is the second largest fuel producer in Poland. The Company's refinery in GdaÅ„sk is among the newest, the most advanced and most environmentally-friendly plants of this type in Europe. In 2019, the refinery operated at full capacity, having processed 10.7m tonnes of crude oil.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +121,What is the company name?,"Health and working environment A healthy, inclusive and safe working environment is important to ensure safe and efficient operations. To maintain a good working environment in the long term, we systematically monitor trends related to illness, and especially work-related illness. A significant contributor to the latter has been psychosocial aspects and these have therefore been actively managed and monitored ",Aker BP,Aker-BP-Sustainability-Report-2019.pdf,[1],0.0,2019,Aker BP,TEXT,"[""AkerBP""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +122,What is the company name?,"Health and working environment are integral parts of our efforts to safeguard people by focusing on risk management of factors such as chemicals, noise, ergonomic workplace and psychosocial aspects. To reduce downsides and realise sustainable and lasting upsides, we monitor and manage psychosocial aspects on an ongoing basis. As our international presence develops, the company is presented with different sets of security risks that we need to manage. The security threat landscape has evolved significantly since we launched our five-year security roadmap in 2015. 
Equinor faces a high threat of targeted terrorist attacks in some locations, furthermore, criminal violence is a concern for staff at some of the assets and offices. Worldwide there is a high threat of cyber-attacks, and this is expected to continue to grow. Against this backdrop, we continue to address these threats through a strengthened security culture and organisation which seeks to manage all security risks to our people, assets and information.",Cenovus Energy,Cenovus Annual Report 2019.pdf,[1],0.0,2019,Cenovus Energy,TEXT,"[""cenovus ENERGY""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +123,What is the company name?,"High value: We deliver energy to millions of people and create value for our shareholders. Through our core business and supply chain, we create economic value and opportunities for society and communities. We provide jobs and develop capabilities among our own employees and beyond our company. ",Transocean Ltd,Transocean_Sustain_digital_FN_4 2017_2018.pdf,[1],0.0,2017/2018,Transocean,TEXT,"[""Transocean Sustainability Report 2017/2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +124,What is the company name?,"However, to learn and improve our business activities we evaluate near-misses and undesirable conditions with respect to the potential for major accidents under slightly different circumstances. Last year we identified two conditions with major accident potential. A pressure vessel valve at the Hammerfest LNG plant in Norway had weaknesses that could have resulted in a situation of overpressure, a large hydrocarbon leakage and subsequent ignition. 
And a blowout preventer at the Gullfaks C platform offshore Norway had internal damage and design issues that could have caused a well control situation developing into a blowout.",Total SA,NYSE_TOT_2016 annual.pdf,[1],0.0,2016,Total,TEXT,"[""TOTAL""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +125,What is the company name?,Human rights in the supply chain The supply chain continues to be an important focus area for our human rights efforts in Equinor. ,Devon,NYSE_DVN_2017.pdf,[8],0.0,2017,Devon,TEXT,"[""A Delaware corporation formed in 1971, and publicly held since 1988, Devon (NYSE: DVN) is an +independent energy company engaged primarily in the exploration, development and production of oil, natural gas +and NGLs. Our operations are concentrated in various North American onshore areas in the U.S. and Canada. +Additionally, we control EnLink, a publicly traded MLP with an integrated midstream business with significant size +and scale in key operating regions in the U.S. For additional information regarding our control of, and ownership +interest in, EnLink and its indirect general partner, the General Partner, see Note 20 in ""Item 8. Financial Statements +and Supplementary Data"" of this report.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +126,What is the company name?,"I am safety expectations at all organisational levels were launched in 2019, this to enhance employee engagement and more active risk management. The aim is to ensure a more consistent behavioural pattern across the company. ",Fugro NV,FUGRO_JV2019_Clickable.pdf,[6],0.0,2019,Fugro,TEXT,"[""In 2019, we made significant progress with the implementation of our Path to Profitable +Growth strategy, supporting the continued recovery of our results. Our marine business +performed significantly better, supported by higher activity levels. 
In a rapidly changing +world, there are ample opportunities for Fugro to contribute to the safe, reliable, +sustainable and efficient development and operation of our clients""™ assets. Not primarily +through technology or equipment, but by making the most of our people's knowledge, +experience and insight.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +127,What is the company name?,"Implemented new strategy for diversity and inclusion Started up 6 fields, including Johan Sverdrup generating annually 2,700 manyears Successful bid for Empire Wind, with total investments of USD3 billion. Will power over 500,000 homes in New York.",Cenovus Energy,Cenovus Annual Report 2012.pdf,[1],0.0,2012,cenovus ENERGY,TEXT,"[""cenovus energy 2012 annual report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +128,What is the company name?,Implementing Equinor human rights project ambitions ,Adani,Adani Groupl Adani Enterprises Sustainability Report 2019.pdf,[4],0.0,2018-19,Adani Enterprises Ltd.,TEXT,"[""Sustainability Report FY 19 is a formal and transparent communication of the Sustainability performance of Adani Enterprises Ltd.: Mining Business to its stakeholders. The report has been prepared in accordance with the GRI Standards: Core option. Additionally, environmental performance reflected in the report has been calculated using the factors and values provided in the Green House Gas (GHG) Protocol and Inter-Governmental Panel on Climate Change (IPCC). Various national and local rules, regulations and guidelines have also been followed to assist in AEL- Mining business's environmental and social footprint evaluation. 
The report contains disclosure for the prioritized material issues- details of which have been provided in the chapter titled 'Stakeholder Engagement and Materiality Assessment.'""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +129,What is the company name?,"In 2018 we became one of the founding patrons of the UN Global Compact Action Platform for Sustainable Ocean Business. The platform is a three-year global programme that brings together business, civil society, the UN and governments to advance the ocean economy and sustainable development. In 2019, Equinor contributed to the development of the Ocean Opportunities Report and UN Global Compact Principles for Sustainable Ocean Business, launched in September 2019. Equinor has signed up to these nine principles.",Chesapeake energy,Chesapeake 2018 Corporate Responsibility Report.pdf,[1],0.0,2018,Chesapeake energy,TEXT,"[""Chesapeake energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +130,What is the company name?,"In 2018, the Board of Directors adopted the TATNEFT Group Strategy until 2030, accumulating the Company's ambitious goals based on the previously approved Strategy 2025 that already confirmed its effectiveness at the early stages keeping a steady focus on ensuring a long-term growth in shareholder value. The updated goals are aimed at maximizing business efficiency and return on existing assets. 
Our priorities are to further strengthen the resource and technological potential, develop innovative forms of production process management and organization, improve margins across all business segments, and sustain a strong position of financial stability and growth of the Company.",Tatneft,PJSC Tatneft annual report 2018.pdf,[19],0.0,2018,TATNEFT,TEXT,"[""In 2018, the Board of Directors adopted the TATNEFT Group +Strategy until 2030, accumulating the Company's ambitious goals +based on the previously approved Strategy 2025 that already +confirmed its effectiveness at the early stages keeping a steady +focus on ensuring a long-term growth in shareholder value. The +updated goals are aimed at maximizing business efficiency and +return on existing assets. Our priorities are to further strengthen +the resource and technological potential, develop innovative forms +of production process management and organization, improve +margins across all business segments, and sustain a strong +position of financial stability and growth of the Company.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +131,What is the company name?,"In 2019, Equinor announced a new partnership with the Aberdeen Science Centre focusing on digitalisation and new technology. Equinor continues its support for NASA in Aberdeen and TechFest. In 2019, participation in the joint Heroes of Tomorrow event with TechFest was doubled to over 400 young people. ",Devon,NYSE_DVN_2016.pdf,[8],0.0,2016,Devon,TEXT,"[""A Delaware corporation formed in 1971, Devon is an independent energy company engaged primarily in the +exploration, development and production of oil, natural gas and NGLs. Our operations are concentrated in various +North American onshore areas in the U.S. and Canada. Additionally, we control EnLink, a publicly-traded MLP +with an integrated midstream business with significant size and scale in key operating regions in the U.S. 
For +additional information regarding our control of, and ownership interest in, EnLink and its indirect general partner, +the General Partner, see Note 2 in ""Item 8. Financial Statements and Supplementary Data"" of this report.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +132,What is the company name?,"In 2019, the Enel Group continued its growth, hitting all the targets we had set ourselves, despite the deterioration in the competitiveness of conventional generation. This prompted us to write down almost all the Group's coal-fired plants and contributed to the continuing instability in some Latin American economies.",Enel,Enel SpA Annual Report 2019.pdf,[7],0.0,2019,Enel Group,TEXT,"[""In 2019, the Enel Group continued its growth, hitting all the targets we had set ourselves, despite the deterioration in the competitiveness of conventional generation. This prompted us to write down almost all the Group's coal-fired plants and contributed to the continuing instability in some Latin American economies.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +133,What is the company name?,"In 2019, we continued to hold training sessions with select groups, focusing on identifying and managing human rights risks and impacts from our activities and throughout our supply chain. This year, more than 400 employees were trained through a full-day classroom course on Supply Chain Management Ethics, anti-corruption and human rights. This included all safety and sustainability leaders in the business area Technology, Projects and Drilling; the procurement teams in, amongst others, Brazil and Nicaragua; and for personnel involved in supply chain activities at Krst, Norway. Furthermore, personnel from select suppliers in Brazil joined a two-hour training session on human rights in the supply chain. Additionally, Shift Project has delivered a full-day training with over 30 representatives from the Legal function. 
In total, over 500 employees attended classroom-based targeted training sessions.",CR Power,China Resources Power Holdings Co Ltd Annual Report 2018.pdf,[13],0.0,2018,CR Power,TEXT,"[""While the Chinese power industry is facing imminent challenges, +opportunities also arise. In 2018, CR Power actively responded to +changes caused by power reform and industrial transformation, +accelerated the development of renewable energy, disposed of +inefficient assets, and actively promoted business innovation and +transformation.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +134,What is the company name?,"In 2019, we focused our efforts towards targeted groups and areas, to further improve the effectiveness of our actions. We experienced increased openness to address risks and dilemmas, more active engagement and reflection around company values, and demand for more training to tackle challenges. We consider all these behaviours to be indicators of improvements in embedding a rights-respecting culture.",EnLink,2019_EnLink_Sustainability_Report_-_Issued_May_7_2020.pdf,[4],0.0,2019,EnLink,TEXT,"[""In 2019, EnLink increased +employee focus on sustainable +business practices through the +development and successful +deployment of an employee +education campaign led by +our Sustainability Steering +Committee. We""™ve taken +several steps in further +advancing our goals, including +adding two new directors to our +Board of Directors, increasing +our diversity of experience, +gender, age, and ethnicity. 
+One of our new directors +brings sustainability experience, +having created a corporate +responsibility committee as a +director at another publicly +traded company.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +135,What is the company name?,"In defining and implementing its strategic vision, Enel carefully integrates and combines all relevant factors: economic-financial, environmental, social and governance-related.",Enel,Enel SA sustainability-report-2017.pdf,[5],0.0,2017,Enel,TEXT,"[""In defining and implementing its strategic vision, Enel carefully integrates and combines all relevant factors: economic-financial, environmental, social and governance-related.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +136,What is the company name?,"In our onshore US operations, significant environmental aspects are related to water sourcing and usage for the hydraulic fracturing process, robust well design and operational procedures to minimise impacts to the environment, and waste management for drill cuttings and produced and flowback water.",Lundin Energy AB,sr_2019_e.pdf,[1],0.0,2019,Lundin Petroleum,TEXT,"[""Lundin Petroleum ""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +137,What is the company name?,"In our opinion the Ethics Helpline reporting works well. Based on a review of the reported concerns and the number of reports received through the Ethics Helpline in 2019, we do not see any immediate need for an adjustment to the management approach. However, we work continuously with improving our processes. ",RWE,RWE-csr_overall-report-2019.pdf,[26],0.0,2019,RWE AG,TEXT,"[""The Executive Board of RWE AG has approved the report for publication.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +138,What is the company name?,"In our supply chain work, we focused more deeply on mitigation, and saw specific actions being defined and progressed based on our targeted worker-based reviews. 
Until meaningful leading and performance indicator are created, our progress and performance will be assessed on anecdotal evidence. ",Cenovus Energy,Cenovus Annual Report 2016.pdf,[1],0.0,2016,Cenovus Energy,TEXT,"[""cenovus ENERGY""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +139,What is the company name?,"In support of combatting plastic pollution of the oceans we participate in an initiative together with the International Association of Oil and Gas Producers (IOGP), national and EU authorities for assessing the use, regulation, limitations and possible substitution of chemicals factually or potentially containing microplastic. Use of water-soluble products containing microplastic are not allowed in our operations, and we enforce strict restrictions on use of products containing microplastic in oil-based fluids, i.e. fluids not discharged to nature. We share the general concern related to plastic pollution of the ocean and continue the work to identify and substitute chemicals we use that contain microplastics.",LUKOIL,LUKOIL_ANNUAL_REPORT_2018_ENG.pdf,[1],0.0,2018,LUKOIL,TEXT,"[""LUKOIL""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +140,What is the company name?,In the vicinity (5 – 20 km)3 - of protected areas - of areas high biodiversity value ,AES Corporation ,AES Corporation Climate Scenario Report 2018.pdf,[4],0.0,2018,The AES Corporation,TEXT,"[""The AES Corporation (AES) strives every day to improve our customers""™ lives by providing reliable and affordable access to power while setting the bar for innovation in the industry.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +141,What is the company name?,Inside - protected areas - areas of high biodiversity value ,EDF,EDF-urd-annual-financial-report-2019-en-2.pdf,[4],0.0,2019,Électricité de France SA,TEXT,"[""In this Universal Registration Document (the ""Universal Registration Document""), unless otherwise stated, the terms ""Company"" and 
""EDF"" refer to Électricité de France SA, and the terms ""EDF group"" and ""Group"" refer to EDF and its subsidiaries and affiliates.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +142,What is the company name?,"Investing in low-carbon research and technology We believe new technologies and innovation will provide future solutions to energy and climate challenges. This is why Equinor’s R&D projects are essential. Equinor’s current ambition is to increase the low carbon (renewable energy, low carbon solutions, and energy efficiency) share of R&D funding to 25% by 2020. ",Enel,Enel annual-report-2017.pdf,[5],0.0,2017,Enel,TEXT,"[""Open to the world, to technology and, internally, among our people. This is the strategic concept of Open Power. But in order to transfer to our customers and stakeholders the essence of a new innovative and open Enel, it is essential to instill this approach to openness within the company.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +143,What is the company name?,It gives us great pleasure to present NOVATEK's Eleventh Sustainability Report 2017 prepared in accordance with the new provisions of the international GRI Standards,NOVATEK,Sustainability_Report_2017_Eng_small[1].pdf,[2],0.0,2017,NOVATEK,TEXT,"[""It gives us great pleasure to present NOVATEK's Eleventh Sustainability Report 2017 prepared in accordance with the new provisions of the international GRI Standards""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +144,What is the company name?,JSC OGK-2,PAO OGK-2,PAO OGK-2_AR 2018.pdf,[2],0.0,2018,JSC OGK-2,TEXT,"[""JSC OGK-2""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +145,What is the company name?,LUKOIL,LUKOIL,LUKOIL_ANNUAL_REPORT_2018_ENG.pdf,[1],0.0,2018,LUKOIL,TEXT,"[""LUKOIL""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +146,What is the company name?,LUKOIL GROUP SUSTAINABILITY REPORT 
2018,LUKOIL,Lukoil_sustainability_report_2018.pdf,[1],0.0,2018,LUKOIL,TEXT,"[""LUKOIL GROUP SUSTAINABILITY REPORT 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +147,What is the company name?,Low carbon Creating a low-carbon business advantage Industry leader in carbon efficiency ,BASF SE,2015_BASF_Report.pdf,[1],0.0,2015,BASF,TEXT,"[""BASF Report 2015""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +148,What is the company name?,"Low carbon: To thrive in the energy transition, we aim to maintain our position as one of the industry leaders in carbon efficient oil and gas production, grow in new energy solutions and step up helping accelerating decarbonization of society. ",Total SA,NYSE_TOT_2017 annual.pdf,[1],0.0,2017,Total,TEXT,"[""TOTAL""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +149,What is the company name?,Lundin Petroleum ,Lundin Energy AB,ar_2019_e.pdf,[1],0.0,2019,Lundin Petroleum,TEXT,"[""Lundin Petroleum ""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +150,What is the company name?,Management Board's report on activities of PGE Polska Grupa Energetyczna S.A. and PGE Capital Group for year 2018,PGE,PGE_Mngmnt_Board_consolidated_report_PGE_CG_2018_with comments.pdf,[1],0.0,2018,PGE,TEXT,"[""Management Board's report on activities of PGE Polska Grupa Energetyczna S.A. and PGE Capital Group for year 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +151,What is the company name?,Management of climate-related risks is embedded in Equinor’s enterprise risk management process. 
We use ,DCP Midstream,2019 DCP Midstream annual report.pdf,[1],0.0,2019,DCP Midstream,TEXT,"[""DCP MIDSTREAM, LP (Exact name of registrant as specified in its charter)""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +152,What is the company name?,"Maturing opportunities in onshore We believe in diversifying our offshore wind business and pursuing additional growth options. Having a flexible portfolio gives us the ability to provide power from numerous renewable energy sources including offshore wind, solar and onshore wind. ",Brigham Minerals,10 K Report.pdf,[15],0.0,2019,Brigham Minerals,TEXT,"[""Brigham Minerals, Inc. was incorporated as a Delaware corporation in June 2018 for the purpose of completing the IPO and related transactions. On April 23, 2019, in connection with the IPO, +Brigham Minerals became a holding company whose sole material asset consists of units in Brigham LLC (the ""Brigham LLC Units""). Brigham LLC wholly owns Brigham Resources, which wholly +owns the Minerals Subsidiaries, which own all of our operating assets. 
The remainder of the Brigham LLC Units are held by affiliates of Warburg Pincus LLC (""Warburg Pincus""), Yorktown Partners +LLC (""Yorktown""), Pine Brook Road Advisors, LP (""Pine Brook"") and certain of our management members and other prior investors (together with Warburg Pincus, Yorktown and Pine Brook, the +""Original Owners"").""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +153,What is the company name?,"More data is available in our sustainability performance data and in our Payments to governments report, at Equinor.com.",ROMGAZ,2017 Sustainability Report.pdf,[6],0.0,2017,ROMGAZ SA,TEXT,"[""Societatea Naţională de Gaze Naturale “ROMGAZ” SA is a Romanian legal entity, legally +established as a joint stock company, performing its activity in compliance with the Romanian +laws and with the company’s Articles of Incorporation.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +154,What is the company name?,"Naturally occurring water with a low concentration of salts, or generally accepted as suitable for abstraction and treatment to produce potable water. Includes water from public installations, wells (including groundwater reservoirs), lakes, streams, rivers and purchased fresh water. Fresh water produced from salt water on facilities/installations is not included.",Canadian Natural Resources Ltd,Canadian Natural Resources Annual Report 2017.pdf,[2],0.0,2017,Canadian Natural,TEXT,"[""Canadian Natural demonstrated strong operational and financial performance throughout 2017 and completed its transition to a long life low +decline asset base. 
The Company's focus on disciplined and balanced capital allocation continues, generating sustainable free cash flow for +years to come.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +155,What is the company name?,"Need for efficient climate policies Forceful actions are needed to advance the energy transition, enabling society to combat climate change while promoting affordable energy, economic growth, and sustainable development. ","Aktsionernoe Obshchestvo Rosneftegaz, Moscow",Rosneft_CSR18_EN_Book sustainabilitz 2018.pdf,[1],0.0,2018,Rosneft,TEXT,"[""ROSNEFT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +156,What is the company name?,"New Energy Solutions’ (NES) gross capital expenditure, before including the effect of project financing.",BP,bp-annual-report-and-form-20f-2018.pdf,[1],0.0,2018,BP,TEXT,"[""BP Annual Report and Form 20-F 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +157,What is the company name?,Norway: 40 % reduction in absolute CO₂ emissions by 2030 Equinor renewable equity generation capacity expected to increase ten-fold from 2019 to 2026 to 4-6GW ,Eni SpA,Annual-Report-2018.pdf,[5],0.0,2018,Eni,TEXT,"[""Eni Annual Report 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +158,What is the company name?,"Number of fatal accidents, lost-time injuries, injuries involving substitute work and medical treatment injuries per million hours worked.",CenterPoint Energy,CenterPoint Energy Corporate Responsibility report 2016.pdf,[1],0.0,2016,CenterPoint Energy,TEXT,"[""CenterPoint Energy 2016 Corporate Responsibility Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +159,What is the company name?,"OMV Aktiengesellschaft Trabrennstrasse 6 - 8 1020 Vienna, Austria Tel. 
+43 1 40440-0 info@omv.com www.omv.com",OMV,Sustainability Report 2016_EN.pdf,[61],0.0,2016,OMV Aktiengesellschaft,TEXT,"[""OMV Aktiengesellschaft Trabrennstrasse 6 - 8 1020 Vienna, Austria Tel. +43 1 40440-0 info@omv.com www.omv.com""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +160,What is the company name?,OMV Sustainability Report 2012 The OMV Sustainability Report covers the 2012 business year and describes our sustainability performance and relevant data,OMV,Sustainability Report 2012_EN.pdf,[2],0.0,2012,OMV,TEXT,"[""OMV Sustainability Report 2012 The OMV Sustainability Report covers the 2012 business year and describes our sustainability performance and relevant data""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +161,What is the company name?,OMV Sustainability Report 2013 This report covers the business year 2013 and updates the priorities set out in our 2012 report.,OMV,Sustainability Report 2013_EN.pdf,[2],0.0,2013,OMV ,TEXT,"[""OMV Sustainability Report 2013 This report covers the business year 2013 and updates the priorities set out in our 2012 report.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +162,What is the company name?,"OMV Sustainability Report 2014 This report covers the operations of OMV Group, headquartered in Vienna, Austria, for the 2014 business year.",OMV,Sustainability Report 2014_EN.pdf,[2],0.0,2014,OMV Group,TEXT,"[""OMV Sustainability Report 2014 This report covers the operations of OMV Group, headquartered in Vienna, Austria, for the 2014 business year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +163,What is the company name?,"Oil in regulated or controlled discharges to the sea from Equinor operated activities. This includes produced water, process water, displacement water, ballast water, jetting water, drainage water and water discharged from treatment plants. 
","Aktsionernoe Obshchestvo Rosneftegaz, Moscow",annual 2018.pdf,[1],0.0,2018,Rosneft,TEXT,"[""ROSNEFT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +164,What is the company name?,"Open to the world, to technology and, internally, among our people. This is the strategic concept of Open Power. But in order to transfer to our customers and stakeholders the essence of a new innovative and open Enel, it is essential to instill this approach to openness within the company.",Enel,Enel annual-report-2017.pdf,[5],0.0,2017,Enel,TEXT,"[""Open to the world, to technology and, internally, among our people. This is the strategic concept of Open Power. But in order to transfer to our customers and stakeholders the essence of a new innovative and open Enel, it is essential to instill this approach to openness within the company.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +165,What is the company name?,"Other reports The following Equinor reports provide additional information about our business activities and impacts: • Annual report and Form 20-F, including Payments to ",LUKOIL,Lukoil_sustainability_report_2018.pdf,[1],0.0,2018,LUKOIL,TEXT,"[""LUKOIL GROUP SUSTAINABILITY REPORT 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +166,What is the company name?,"Our actions Anti-bribery and corruption compliance - Our ethics and anti-corruption training efforts during 2019 included both general and targeted training sessions through a combination of e-learning and workshops. In 2019, we had particular focus on integrating money laundering into to our anti-corruption workshops to increase awareness of money laundering risk within the organisation. 
",Transneft PJSC,annual 2017.pdf,[1],0.0,2017,TRANSNEFT,TEXT,"[""TRANSNEFT EVOLUTION""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +167,What is the company name?,Our ambition is that all teams are diverse and inclusive by 2025,Coal India Limited,Coal India Ltd Annual Report 2018-2019.pdf,[11],0.0,2019,Coal India Limited,TEXT,"[""I am delighted to welcome you all to the 45th Annual General Meeting of Coal India Limited. The Directors""™ Report and the Financial Statement +for the year ended 31st March""™ 2019 together with the report of Statutory Auditors and report and review of Comptroller & Auditor General of +India are already with you. I am sure you are fully aware of the financial & physical health of your company.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +168,What is the company name?,Our business contributes to the Sustainable Development Goals. We believe in transparency and collaboration for greater impact .,CenterPoint Energy,CenterPoint Energy Annual report 2015.pdf,[1],0.0,2015,CenterPoint Energy,TEXT,"[""CenterPoint Energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +169,What is the company name?,"Our management approach: Sustainability governance and performance framework At Equinor, our approach to sustainability is embedded in how we work. This includes our corporate governance principles, performance and reward framework and management system. ",Intercontinental Exchange,2019-Annual-Report_Web_BMK_vF.pdf,[2],0.0,2019,Intercontinental Exchange,TEXT,"[""As I look back on the past two decades, they are largely defined by rapid +advancements in technology. From consumer and industrial goods to +healthcare and financial services, advancements in technology have +reshaped and disrupted industries, while also creating new opportunities +for those with the acumen to innovate and successfully execute on a +vision. 
Twenty years ago, in May of 2000, we launched Intercontinental +Exchange, a name we chose to reflect our vision of better serving global +markets through our innovative, web-based, technology platform. We +aspired to create a more transparent market that was easily accessible +to all participants. In the years since, our focus on leading technology, +customer-driven product innovation and operating efficiency has +remained core to our strategy. We have built new technology from +scratch; we have acquired old technology and refurbished it; and we +have innovated, developing countless new products and content that +seamlessly flow through a global distribution platform. It is our +operating expertise, leading technology infrastructure and innovative +culture that underpin the quality of the networks we operate and, +ultimately, have proven to be our most valuable competitive advantages.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +170,What is the company name?,"Our performance In 2019, we experienced no major accidents or incidents with fatalities 1.",ROMGAZ,2019 Annual Report.pdf,[1],0.0,2019,"Societatea Nationala de Gaze Naturale ""ROMGAZ"" SA ",TEXT,"[""Societatea Nationala de Gaze Naturale ""ROMGAZ"" SA Consolidated Board of Directors""™ Report 2019""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +171,What is the company name?,Our purpose To turn natural resources into energy for people and progress for society. ,ROMGAZ,2018 Annual Report.pdf,[1],0.0,2018,"Societatea Nationala de Gaze Naturale ""ROMGAZ"" SA ",TEXT,"[""Societatea Nationala de Gaze Naturale ""ROMGAZ"" SA Consolidated Board of Directors""™ Report 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +172,What is the company name?,Our strategic response to climate related risks We acknowledge that an energy transition is ongoing and want to be in the forefront of this change. 
We believe that the energy transition represents opportunities for ,PGE,PGE_Mngmnt_Board_consolidated_report_PGE_CG_2018_with comments.pdf,[6],0.0,2018,PGE,TEXT,"[""Capital Group of PGE Polska Grupa Energetyczna S.A. (""PGE Capital Group"", the ""Capital Group"", ""PGE Group"", the ""Group"") is the largest vertically integrated producer of electricity and heat in Poland.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +173,What is the company name?,"Our sustainability priority areas reflect our main contributions to, and impact on society and entail significant business risks and opportunities.",Tatneft,PJSC Tatneft annual report 2018.pdf,[19],0.0,2018,TATNEFT,TEXT,"[""In 2018, the Board of Directors adopted the TATNEFT Group +Strategy until 2030, accumulating the Company's ambitious goals +based on the previously approved Strategy 2025 that already +confirmed its effectiveness at the early stages keeping a steady +focus on ensuring a long-term growth in shareholder value. The +updated goals are aimed at maximizing business efficiency and +return on existing assets. 
Our priorities are to further strengthen +the resource and technological potential, develop innovative forms +of production process management and organization, improve +margins across all business segments, and sustain a strong +position of financial stability and growth of the Company.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +174,What is the company name?,"Owner and publisher OMV Aktiengesellschaft Head Office TrabrennstraŸe 6-8 1020 Vienna, Austria info.sustainability@omv.com",OMV,Sustainability Report 2014_EN.pdf,[77],0.0,2014,OMV Aktiengesellschaft,TEXT,"[""Owner and publisher OMV Aktiengesellschaft Head Office Trabrennstraße 6-8 1020 Vienna, Austria info.sustainability@omv.com""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +175,What is the company name?,"Owner and publisher OMV Aktiengesellschaft TrabrennstraŸe 6-8 1020 Vienna, Austria info.sustainability@omv.com",OMV,Sustainability Report 2013_EN.pdf,[101],0.0,2013,OMV Aktiengesellschaft,TEXT,"[""Owner and publisher OMV Aktiengesellschaft Trabrennstraße 6-8 1020 Vienna, Austria info.sustainability@omv.com""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +176,What is the company name?,"Owner and publisher: OMV Aktiengesellschaft Trabrennstrasse 6-8 1020 Vienna, Austria info.sustainability@omv.com",OMV,Sustainability Report 2012_EN.pdf,[106],0.0,2012,OMV Aktiengesellschaft,TEXT,"[""Owner and publisher: OMV Aktiengesellschaft Trabrennstrasse 6-8 1020 Vienna, Austria info.sustainability@omv.com""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +177,What is the company name?,PAO NOVATEK ANNUAL REPORT 2017,NOVATEK,AR_FS_2017_ENG.pdf,[1],0.0,2017,PAO NOVATEK,TEXT,"[""PAO NOVATEK ANNUAL REPORT 2017""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +178,What is the company name?,PAO NOVATEK ANNUAL REPORT 2018,NOVATEK,04_NOVATEK_AR_2018_ENG_15.pdf,[1],0.0,2018,PAO NOVATEK,TEXT,"[""PAO NOVATEK ANNUAL REPORT 2018""]",20201030 
1Qbit aggregated_annotations_needs_correction.xlsx,1 +179,What is the company name?,"PGE Group as of the end of 2018 consisted of: ‚ PGE S.A. - the parent company, ‚ 57 subsidiaries subject to consolidation, ‚ 4 associates, ‚ 1 jointly controlled entity.",PGE,PGE_Mngmnt_Board_consolidated_report_PGE_CG_2018_with comments.pdf,[7],0.0,2018,PGE Group,TEXT,"[""PGE Group as of the end of 2018 consisted of: ï‚¡ PGE S.A. - the parent company, ï‚¡ 57 subsidiaries subject to consolidation, ï‚¡ 4 associates, ï‚¡ 1 jointly controlled entity.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +180,What is the company name?,PJSC Gazprom Annual Report 2018,Gazprom PJSC,gazprom-annual-report-2018-en.pdf,[1],0.0,2018,PJSC GAZPROM,TEXT,"[""PJSC Gazprom Annual Report 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +181,What is the company name?,PJSC Gazprom Environmental Report 2018,Gazprom PJSC,gazprom-environmental-report-2018-en.pdf,[1],0.0,2018,PJSC GAZPROM,TEXT,"[""PJSC Gazprom Environmental Report 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +182,What is the company name?,Percentage of employees completed the code of conduct course (%),RWE,RWE-csr_overall-report-2019.pdf,[27],0.0,2019,RWE Group,TEXT,"[""This report contains forward-looking statements regarding the future development of the RWE Group and its companies as well as future economic and political developments""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +183,What is the company name?,Publisher RWE Aktiengesellschaft Altenessener Str. 35 45141 Essen Germany,RWE,RWE-csr_overall-report-2019.pdf,[110],0.0,2019,RWE Aktiengesellschaft,TEXT,"[""Publisher RWE Aktiengesellschaft Altenessener Str. 
35 45141 Essen Germany""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +184,What is the company name?,ROSNEFT,"Aktsionernoe Obshchestvo Rosneftegaz, Moscow",annual_report_2019_eng.pdf,[1],0.0,2019,Rosneft,TEXT,"[""ROSNEFT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +185,What is the company name?,ROSNEFT FOR THE BENEFIT OF RUSSIA,"Aktsionernoe Obshchestvo Rosneftegaz, Moscow",annual 2016.pdf,[1],0.0,2016,Rosneft,TEXT,"[""ROSNEFT FOR THE BENEFIT OF RUSSIA""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +186,What is the company name?,ROSNEFT SUSTAINABILITY REPORT,"Aktsionernoe Obshchestvo Rosneftegaz, Moscow",sustainability 2015.pdf,[1],0.0,2015,Rosneft,TEXT,"[""ROSNEFT SUSTAINABILITY REPORT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +187,What is the company name?,ROSNEFT SUSTAINABILITY REPORT 2016,"Aktsionernoe Obshchestvo Rosneftegaz, Moscow",RN_SR_2016_EN(2) sustainabilitz 2016.pdf,[1],0.0,2016,Rosneft,TEXT,"[""ROSNEFT SUSTAINABILITY REPORT 2016""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +188,What is the company name?,RWE AG is meeting the obligation to publish a Non-financial Report envisaged pursuant to the German Commercial Code (HGB) in a separate section of this CR report.,RWE,RWE-csr_overall-report-2019.pdf,[26],0.0,2019,RWE AG,TEXT,"[""RWE AG is meeting the obligation to publish a Non-financial Report envisaged pursuant to the German Commercial Code (HGB) in a separate section of this CR report.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +189,What is the company name?,RWE AG | Factbook | March 2019,RWE,RWE-factbook_report-2018.pdf,[1],0.0,2019,RWE AG,TEXT,"[""RWE AG | Factbook | March 2019""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +190,What is the company name?,RWE Aktiengesellschaft,RWE,RWE-csr_overall-report-2019.pdf,[36],0.0,2019,RWE Aktiengesellschaft,TEXT,"[""RWE Aktiengesellschaft""]",20201030 1Qbit 
aggregated_annotations_needs_correction.xlsx,1 +191,What is the company name?,"Reduce the net carbon intensity, from initial production to final consumption, of energy produced by at least 50% by 2050",BP,bp-sustainability-report-2019.pdf,[1],0.0,2019,BP,TEXT,"[""BP Sustainability Report 2019""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +192,What is the company name?,"Reduced flaring We have set a company-wide upstream flaring intensity target of 0.2% by 2020 for our operated assets. This was set in 2012 as part of our commitment to the Sustainable Energy for All Initiative. Our aim is to eliminate routine flaring in our operations by 2030 at the latest, in line with the World Bank’s Zero Routine Flaring by 2030 Initiative. In Norway we do not have routine flaring in our operations. We have been working systematically to reduce flaring on the Norwegian Continental Shelf (NCS) as well and have seen a positive trend. Reductions have been achieved mostly by changing our operating procedures, such as when starting a well, and due to hardware changes, ","Aktsionernoe Obshchestvo Rosneftegaz, Moscow",annual_report_2019_eng.pdf,[1],0.0,2019,Rosneft,TEXT,"[""ROSNEFT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +193,What is the company name?,Reducing net carbon intensity by at least 50% by 2050,NOVATEK,Sustainability_Report_2017_Eng_small[1].pdf,[10],0.0,2017,NOVATEK,TEXT," [""NOVATEK is one of Russia's largest independent natural gas producers. 
Ranking third by proved SEC natural gas reserves, it is also one of the top 10 world's largest publicly traded oil and gas companies in terms of gas production boasting one of the industry's lowest exploration and development costs.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +194,What is the company name?,Regular updates of meteorology and oceanography data used in project design and operational planning ,DCP Midstream,2017 DCP Midstream annual report.pdf,[1],0.0,2017,DCP Midstream,TEXT,"[""DCP MIDSTREAM, LP +(Exact name of registrant as specified in its charter)""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +195,What is the company name?,"Renewable energy and low-carbon research and development (R&D) In 2019, Equinor’s renewable energy production (equity basis) increased from 1.3 to 1.8 TWh. The increase is due to a growing portfolio and the first full year of production at Arkona. Capital expenditure on new energy solutions in 2019 was around USD 0.3 billion. The increase is in line with the strategic direction of growing in renewables, and the management approach is assessed to be effective. Our low-carbon and energy efficiency R&D expenditure was around 20% in 2019, which is a small decrease from ",Snam,2017_sustainability_report.pdf,[2],0.0,2017,Snam,TEXT,"[""Snam is Europe's leading gas utility.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +196,What is the company name?,"Renewable energy is expected to grow significantly in all scenarios, especially in the electricity sector where solar and wind takes on a leading role. In 2018, solar and wind accounted for about 7% of the global electricity mix. This is projected to grow to a share of between 30% to 50% depending on the scenario. The growth in electricity from solar and wind power is driven by technological improvements, reduced cost and continued regulatory support. 
",Callon Petroleum Co,Callon Petroleum Co Annual Report 2017.pdf,[2],0.0,2017,Callon Petroleum,TEXT,"[""Callon Petroleum is an independent oil and natural gas company focused on the acquisition, +exploration and development of high-quality assets in the heart of the Permian Basin. +Our mission is to build trust, create value, and drive sustainable growth for our investors, +our employees and the communities in which we operate.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +197,What is the company name?,"Reporting and handling of concerns – The Code of Conduct imposes a duty to report possible violations of the Code or other unethical conduct. We require leaders to take their control responsibilities seriously to prevent, detect and respond to ethical issues. Employees are encouraged ",PGE,PGE_Mngmnt_Board_consolidated_report_PGE_CG_2018_with comments.pdf,[1],0.0,2018,PGE,TEXT,"[""Management Board's report on activities of PGE Polska Grupa Energetyczna S.A. and PGE Capital Group for year 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +198,What is the company name?,"Safety indicators that improve proactivity; leading indicators, have been given higher priority through increased attention to and follow-up of known underlying causes behind incidents. ",OMV,Sustainability Report 2015_EN.pdf,[51],0.0,2015,OMV Aktiengesellschaft,TEXT,"[""Owner and publisher OMV Aktiengesellschaft Trabrennstraße 6-8 1020 Vienna, Austria info.sustainability@omv.com""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +199,What is the company name?,"Safety visibility has been improved through the implementation of a broad set of actions in all locations. This includes ""Life-Saving Rules"" based on the industry standard from International Oil and Gas Producers association which has been rolled out throughout the company. 
",Saipem SpA,SaipemSustainability2018.pdf,[72],0.0,2018,saipem SpA,TEXT,"[""saipem SpA +Via Martiri di Cefalonia, 67 +20097 San Donato Milanese +Milan - Italy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +200,What is the company name?,"Security Equinor continues to face a range of physical and cyber security threats that are continuously monitored, evaluated and communicated across the company. ",Transneft PJSC,sustainable development 2017.pdf,[1],0.0,2017,Transneft,TEXT,"[""TRANSNEFT +EVOLUTION""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +201,What is the company name?,Snam is Europe's leading gas utility.,Snam,2017_sustainability_report.pdf,[2],0.0,2017,Snam,TEXT,"[""Snam is Europe's leading gas utility.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +202,What is the company name?,"Snam's business model is based on sustainable growth, transparency, nurturing talent, and development of local areas by constantly listening to and exchanging dialogues with local communities, also thanks to the social initiatives of the Snam Foundation.",Snam,2018_sustainability_report.pdf,[2],0.0,2018,Snam,TEXT,"[""Snam's business model is based on sustainable growth, transparency, nurturing talent, and development of local areas by constantly listening to and exchanging dialogues with local communities, also thanks to the social initiatives of the Snam Foundation.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +203,What is the company name?,"Societatea Naţională de Gaze Naturale ROMGAZ SA is a Romanian legal entity, legally established as a joint stock company, performing its activity in compliance with the Romanian laws and with the company’s Articles of Incorporation.",ROMGAZ,2017 Sustainability Report.pdf,[6],0.0,2017,ROMGAZ SA,TEXT,"[""Societatea Naţională de Gaze Naturale “ROMGAZ” SA is a Romanian legal entity, legally +established as a joint stock company, performing its activity in compliance with 
the Romanian +laws and with the company’s Articles of Incorporation.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +204,What is the company name?,Societe Generale implemented its commitment announced in correlation with the COP21 to align its financing in order to contribute towards limiting the global temperature rise to less than 2C by 2100.,Societe Generale,SG-RSE2016-2017-EN.pdf,[3],0.0,2016,Societe Generale,TEXT,"[""Societe Generale implemented its commitment announced in correlation with the COP21 to align its financing in order to contribute towards limiting the global temperature rise to less than 2°C by 2100.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +205,What is the company name?,Some people are still disputing global warming. We’re acting on it.,"Aktsionernoe Obshchestvo Rosneftegaz, Moscow",RN_SR_2016_EN(2) sustainabilitz 2016.pdf,[1],0.0,2016,Rosneft,TEXT,"[""ROSNEFT SUSTAINABILITY REPORT 2016""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +206,What is the company name?,South Riding Point terminal is being investigated and the final classification is not concluded. ,Elektrik Üretim A.Ş.,Elektrik Üretim A.Ş. Genel Müdürlüğü (EÜAŞ) Annual Report 2018.pdf,[1],0.0,2018,ELEKTRİK ÜRETİM A.Ş.,TEXT,"[""ELEKTRİK ÜRETİM A.Ş. ELECTRICITY GENERATION CO.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +207,What is the company name?,"Southern Company is transitioning our energy generation fleet for a low-carbon future. In doing so, we have established an intermediate goal of a 50 percent reduction in carbon emissions from 2007 levels by 2030 and a long-term goal of low- to no-carbon operations by 2050.",Southern Company,Southern Company_2018_Corporate_Responsibility_Report.pdf,[1],0.0,2018,Southern Company,TEXT,"[""Southern Company is transitioning our energy generation fleet for a low-carbon future. 
In doing so, we have established an intermediate goal of a 50 percent reduction in carbon emissions from 2007 levels by 2030 and a long-term goal of low- to no-carbon operations by 2050.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +208,What is the company name?,"Strategy – Disclose the actual and potential impacts of climate-related risks and opportunities on the organisation’s businesses, strategy, and financial planning where such information is material ","Aktsionernoe Obshchestvo Rosneftegaz, Moscow",sustainability 2015.pdf,[1],0.0,2015,Rosneft,TEXT,"[""ROSNEFT SUSTAINABILITY REPORT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +209,What is the company name?,Supplier human rights (HR) verifications conducted,OMV,Sustainability Report 2014_EN.pdf,[2],0.0,2014,OMV Group,TEXT,"[""OMV Sustainability Report 2014 This report covers the operations of OMV Group, headquartered in Vienna, Austria, for the 2014 business year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +210,What is the company name?,Supplier human rights verifications conducted (number of),RWE,RWE-csr_overall-report-2019.pdf,[110],0.0,2019,RWE Aktiengesellschaft,TEXT,"[""Publisher RWE Aktiengesellschaft Altenessener Str. 35 45141 Essen Germany""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +211,What is the company name?,"Sustainability Report FY 19 is a formal and transparent communication of the Sustainability performance of Adani Enterprises Ltd.: Mining Business to its stakeholders. The report has been prepared in accordance with the GRI Standards: Core option. Additionally, environmental performance reflected in the report has been calculated using the factors and values provided in the Green House Gas (GHG) Protocol and Inter-Governmental Panel on Climate Change (IPCC). 
Various national and local rules, regulations and guidelines have also been followed to assist in AEL- Mining business's environmental and social footprint evaluation. The report contains disclosure for the prioritized material issues- details of which have been provided in the chapter titled 'Stakeholder Engagement and Materiality Assessment.'",Adani,Adani Groupl Adani Enterprises Sustainability Report 2019.pdf,[4],0.0,2018-19,Adani Enterprises Ltd.,TEXT,"[""Sustainability Report FY 19 is a formal and transparent communication of the Sustainability performance of Adani Enterprises Ltd.: Mining Business to its stakeholders. The report has been prepared in accordance with the GRI Standards: Core option. Additionally, environmental performance reflected in the report has been calculated using the factors and values provided in the Green House Gas (GHG) Protocol and Inter-Governmental Panel on Climate Change (IPCC). Various national and local rules, regulations and guidelines have also been followed to assist in AEL- Mining business's environmental and social footprint evaluation. The report contains disclosure for the prioritized material issues- details of which have been provided in the chapter titled 'Stakeholder Engagement and Materiality Assessment.'""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +212,What is the company name?,Sustainability performance data Performance data in this report and supplementary data are presented online at sustainability.equinor.com.,NOVATEK,Sustainability_Report_2017_Eng_small[1].pdf,[2],0.0,2017,NOVATEK,TEXT,"[""It gives us great pleasure to present NOVATEK's Eleventh Sustainability Report 2017 prepared in accordance with the new provisions of the international GRI Standards""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +213,What is the company name?,TATNEFT Company successfully accomplished all of the planned programs in 2015. 
In the difficult macroeconomic environment the Company implemented a set of production and economic compensatory measures to maintain the Company's status in the group of the leaders of the Russian fuel and energy complex.,Tatneft,PJSC Tatneft annual report 2015.pdf,[3],0.0,2015,TATNEFT,TEXT,"[""TATNEFT Company successfully accomplished all of the planned programs in 2015. In the difficult macroeconomic +environment the Company implemented a set of production and economic compensatory measures to maintain +the Company's status in the group of the leaders of the Russian fuel and energy complex.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +214,What is the company name?,TEEKAY CORPORATION 2017 Sustainability Report,Teekay Corp,2017-Sustainability-Report.pdf,[1],0.0,2017,TEEKAY CORPORATION,TEXT,"[""TEEKAY CORPORATION 2017 Sustainability Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +215,What is the company name?,TEEKAY CORPORATION 2018 Sustainability Report,Teekay Corp,Teekay-Corporation-2018-Sustainability-Report.pdf,[1],0.0,2018,TEEKAY CORPORATION,TEXT,"[""TEEKAY CORPORATION +2018 Sustainability Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +216,What is the company name?,TGS ANNUAL REPORT / 2019,TGS NOPEC Geophysical Co ASA,TGS-AR2019-FINAL-WEB-PAGES-reduced annual.pdf,[1],0.0,2019,TGS,TEXT,"[""TGS ANNUAL REPORT / 2019""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +217,What is the company name?,THE AES CORPORATION,AES Corporation ,AES Corporation Annual Report 2018.pdf,[1],0.0,2018,THE AES CORPORATION,TEXT,"[""THE AES CORPORATION""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +218,What is the company name?,TOTAL,Total SA,NYSE_TOT_2016 annual.pdf,[1],0.0,2016,Total,TEXT,"[""TOTAL""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +219,What is the company name?,TOTAL COMMITTED TO BETTER ENERGY,Total SA,NYSE_TOT_2015 
annual.pdf,[1],0.0,2015,Total,TEXT,"[""TOTAL +COMMITTED TO BETTER ENERGY""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +220,What is the company name?,TRANSNEFT,Transneft PJSC,annual 2018.pdf,[1],0.0,2018,Transneft,TEXT,"[""TRANSNEFT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +221,What is the company name?,TRANSNEFT EVOLUTION,Transneft PJSC,sustainable development 2017.pdf,[1],0.0,2017,Transneft,TEXT,"[""TRANSNEFT +EVOLUTION""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +222,What is the company name?,"Tax transparency and payments to governments reporting - We believe that through disclosure of payments to governments we promote accountability and build trust in the societies where we operate. We have reported our payments to governments on a country-by-country basis for more than a decade. Since 2014, we have reported such payments on a project-by-project and legal entities basis, in our Annual Report and Form 20F. This reporting represents a core element of transparent corporate tax disclosure. Since 2018, we have published our global tax strategy, available online. These disclosures are in line with our commitment to conduct our business activities in a transparent way. ",Societe Generale,SG-RSE2016-2017-EN.pdf,[3],0.0,2016,Societe Generale,TEXT,"[""For Societe Generale, being a responsible company lies at the very heart of our business lines""™ mission and reflects the essence of the relationship bank of reference that we strive to be.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +223,What is the company name?,"The AES Corporation (NYSE: AES) is a Fortune 200 global power company founded in 1981. The company's headquarters are in Arlington, Virginia, United States (US). 
AES is publicly traded company, incorporated in Delaware and governed by a Board of Directors.",AES Corporation ,AES Corporation 2018_SustainabilityReport_vFinal.pdf,[4],0.0,2018,The AES Corporation,TEXT,"[""The AES Corporation (NYSE: AES) is a Fortune 200 global power company founded in 1981. The company's headquarters are in Arlington, Virginia, United States (US). AES is publicly traded company, incorporated in Delaware and governed by a Board of Directors.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +224,What is the company name?,The CR Report of RWE AG is published as a GRI Report and conforms with the GRI Standards (2016) of the Global Reporting Initiative in a selection based on a Materiality Analysis of the topics relevant for our business.,RWE,RWE-csr_overall-report-2019.pdf,[26],0.0,2019,RWE AG,TEXT,"[""The CR Report of RWE AG is published as a GRI Report and conforms with the GRI Standards (2016) of the Global Reporting Initiative in a selection based on a Materiality Analysis of the topics relevant for our business.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +225,What is the company name?,"The Company's achievements and outlook were highly rated by the stock market. Over the course of the year, TATNEFT's stock price has been among the best performers among Russian oil and gas companies.",Tatneft,PJSC Tatneft annual report 2017.pdf,[3],0.0,2017,TATNEFT,TEXT,"[""The Company's achievements and outlook were highly rated +by the stock market. 
Over the course of the year, TATNEFT's +stock price has been among the best performers among +Russian oil and gas companies.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +226,What is the company name?,"The Enel Group structure is organized into a matrix that comprises: >>Business Lines (Global Thermal Generation, Global Trading, Global Infrastructure and Networks, Enel Green Power, Enel X), which are responsible for managing and developing assets, optimizing their performance and the return on capital employed in the various geographical areas in which the Group operates. The Business Lines are also responsible for improving the efficiency of the processes they manage and sharing best practices at the global level. The Group will benefit from a centralized industrial vision of projects in the various Business Lines. Each project will be assessed not only on the basis of its financial return but also in relation to the best technologies available at the Group level, >>Regions and Countries (Italy, Iberia, South America, Europe and Euro-Mediterranean Affairs, North and Central America, Africa, Asia and Oceania), which are responsible for managing relationships with institutional bodies and regulatory authorities, as well as selling electricity and gas, in each of the countries in which the Group operates, while also providing staff and other service support to the Business Lines.",Enel,Enel annual-report-2018.pdf,[9],0.0,2018,Enel Group,TEXT,"[""The Enel Group structure is organized into a matrix that comprises: +>>Business Lines (Global Thermal Generation, Global Trading, Global Infrastructure and Networks, Enel Green Power, Enel X), which are responsible for managing and developing assets, optimizing their performance and the return on capital employed in the various geographical areas in which the Group operates. 
The Business Lines are also responsible for improving the efficiency of the processes they manage and sharing best practices at the global level. The Group will benefit from a centralized industrial vision of projects in the various Business Lines. Each project will be assessed not only on the basis of its financial return but also in relation to the best technologies available at the Group level, +>>Regions and Countries (Italy, Iberia, South America, Europe and Euro-Mediterranean Affairs, North and Central America, Africa, Asia and Oceania), which are responsible for managing relationships with institutional bodies and regulatory authorities, as well as selling electricity and gas, in each of the countries in which the Group operates, while also providing staff and other service support to the Business Lines.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +227,What is the company name?,The Executive Board of RWE AG has approved the report for publication.,RWE,RWE-csr_overall-report-2019.pdf,[26],0.0,2019,RWE AG,TEXT,"[""The Executive Board of RWE AG has approved the report for publication.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +228,What is the company name?,"The Mariner project supports around 700 long term jobs and between 80-90% of the contracts for offshore work during the production phase were awarded to UK-based suppliers. The project will create ripple effects in the local supply chain for the next 30 years of production. In the UK, Equinor works closely with the local supply chain and peers, focusing on collaboration and digitalisation to improve industry performance. ",Wintershall Dea,Wintershall-Dea_Sustainability_Report_2019.pdf,[1],0.0,2019,Wintershall Dea,TEXT,"[""wintershall dea""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +229,What is the company name?,The PJSC TATNEFT's securities are listed in the Russian and international stock markets. 
The Company's ordinary and preferred shares are traded on the Moscow Stock Exchange and are quoted on the highest list of the first (I) level. 28.5% of the voting shares were deposited to be converted to global American Depository Receipts (ADR). The Company's depositary receipts are included in the listing of the London Stock Exchange (ATAD).,Tatneft,PJSC Tatneft annual report 2016.pdf,[4],0.0,2016,TAFTNEFT,TEXT,"[""The PJSC TATNEFT's securities are listed in the Russian and international stock markets. +The Company's ordinary and preferred shares are traded on the Moscow Stock Exchange +and are quoted on the highest list of the first (I) level. 28.5% of the voting shares were +deposited to be converted to global American Depository Receipts (ADR). The Company's +depositary receipts are included in the listing of the London Stock Exchange (ATAD).""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +230,What is the company name?,"The company has a separate corporate risk committee chaired by the chief financial officer. The committee meets at least three times per year to give advice and make recommendations on Equinor’s enterprise risk management, including climate-related risks.",Cenovus Energy,Cenovus Sustainability Report 2018.pdf,[1],0.0,2018,Cenovus Energy,TEXT,"[""cenovus ENERGY""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +231,What is the company name?,"The corporate sustainability function is responsible for overseeing climate change (including climate-related risk), environment, human rights and social issues. The corporate safety function is responsible for safety, health, work environment and security. The chief compliance officer is responsible for business ethics and compliance. 
",VERBUND,VERBUND-Integrated-Annual-Report-2018-English.pdf,[9],0.0,2018,VERBUND,TEXT,"[""This integrated annual report contains the Group management report published by VERBUND for +financial year 2018, the Group report on non-financial information (NFI Report) and the Group's +consolidated financial statements, including the notes to the consolidated financial statements. The +principles of fair enterprise management followed by VERBUND are laid out in the Corporate Governance +Report. This integrated annual report thus not only presents the Group's financial and legal information +but also deals with further aspects of sustainability and proper conduct of business operations.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +232,What is the company name?,"The effective interface between security disciplines has been further strengthened through the modification of our security risk assessment tool to combine physical, IT and personal security risk assessments. We have also focused on competency assurance for security risk management experts which is intended to drive standardization and quality.",RWE,RWE-csr_overall-report-2019.pdf,[26],0.0,2019,RWE Group,TEXT,"[""Owing to the fact that Group (financial) reporting is taking place with the two temporary positions ""innogy - continuing operations"" and ""Operations acquired from E.ON"", explicit reference is made to these items and this then refers to the RWE Group overall.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +233,What is the company name?,"The figure includes CO₂ costs and other environmental costs paid by Equinor in 2019. Costs are reported for Equinor-operated assets only, on a 100% basis. This includes EU Emission Allowances System (EU ETS) quotas, Norwegian CO₂ tax and a CO₂ related royalty fee in Brazil. 
",Royal Dutch Shell plc,shell_annual_report_2018.pdf,[1],0.0,2018,Royal Dutch Shell plc,TEXT,"[""Annual Report and Form 20-F for the year ended December 31, 2018, Royal Dutch Shell plc""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +234,What is the company name?,"The following factors, in addition to those discussed elsewhere in this Quarterly Report on Form 10-Q and in other securities filings (including Xcel Energy's Annual Report on Form 10-K for the fiscal year ended Dec. 31, 2019",XCEL,Xcel_2019_CorporateResponsibility_Report_FullFinal.pdf,[2],0.0,2019,Xcel Energy,TEXT,"[""The following factors, in addition to those discussed elsewhere in this Quarterly Report on Form 10-Q and in other securities filings (including Xcel Energy's Annual Report on Form 10-K for the fiscal year ended Dec. 31, 2019""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +235,What is the company name?,"The methane intensity (operated) remained very low at around 0.03%, which is significantly lower than the industry average of around 0.3% as measured by the Oil and Gas Climate Initiative (OGCI 2018 Annual Report). ",VERBUND,VERBUND-Integrated-Annual-Report-2019-Englisch.pdf,[9],0.0,2019,VERBUND,TEXT,"[""This integrated annual report contains the Group management report published by VERBUND for financial +year 2019, the Group report on non-financial information (NFI Report) and the Group's consolidated +financial statements, including the notes to the consolidated financial statements. The principles of fair +enterprise management followed by VERBUND are laid out in the Corporate Governance Report. 
This +integrated annual report thus not only presents the Group's financial and legal information but also deals +with further aspects of sustainability and proper conduct of business operations.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +236,What is the company name?,"The volume of drill cuttings from US onshore operations, classified as exempt waste, increased by 53% in 2019. The increase is mainly due to cuttings being transported as waste to landfill sites rather than collected in on-site disposal pits. Management of such waste varies with location and landowner preferences and causes year to year variations in solid exempt waste. The disposal of liquid exempt waste has increased by 17% since 2018 due to higher amount of produced water from wells. Use of fracking chemicals has decreased by 15% due to reduced fracking activity at Bakken and Eagle Ford in 2019.",TGS NOPEC Geophysical Co ASA,TGS-AR2019-FINAL-WEB-PAGES-reduced annual.pdf,[1],0.0,2019,TGS,TEXT,"[""TGS ANNUAL REPORT / 2019""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +237,What is the company name?,The world needs energy providers that can deliver energy with lower emissions,Duke Energy,2017-DukeSR.pdf,[3],0.0,2017,Duke Energy,TEXT,"[""I am pleased to share Duke Energy's 12th Sustainability Report. This year's report reflects a theme we""™ve been +observing over the past dozen years: The energy industry is in transition and the successful companies are those +that continue to recognize and adapt to the changing expectations of the customers and communities they serve.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +238,What is the company name?,"These are therefore not included in the hazardous or non-hazardous waste and waste recovery figures. 
In 2016 a change was made in the categorisation of recovered waste, allowing for the inclusion of treated oil contaminated water.",ENDESA,Endesa SA Annual Report 2017.pdf,[1],0.0,2017,ENDESA,TEXT,"[""Corporate Name: ENDESA, S.A.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +239,What is the company name?,"This integrated annual report contains the Group management report published by VERBUND for financial year 2018, the Group report on non-financial information (NFI Report) and the Group's consolidated financial statements, including the notes to the consolidated financial statements. The principles of fair enterprise management followed by VERBUND are laid out in the Corporate Governance Report. This integrated annual report thus not only presents the Group's financial and legal information but also deals with further aspects of sustainability and proper conduct of business operations.",VERBUND,VERBUND-Integrated-Annual-Report-2018-English.pdf,[9],0.0,2018,VERBUND,TEXT,"[""This integrated annual report contains the Group management report published by VERBUND for +financial year 2018, the Group report on non-financial information (NFI Report) and the Group's +consolidated financial statements, including the notes to the consolidated financial statements. The +principles of fair enterprise management followed by VERBUND are laid out in the Corporate Governance +Report. This integrated annual report thus not only presents the Group's financial and legal information +but also deals with further aspects of sustainability and proper conduct of business operations.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +240,What is the company name?,"This integrated annual report contains the Group management report published by VERBUND for financial year 2019, the Group report on non-financial information (NFI Report) and the Group's consolidated financial statements, including the notes to the consolidated financial statements. 
The principles of fair enterprise management followed by VERBUND are laid out in the Corporate Governance Report. This integrated annual report thus not only presents the Group's financial and legal information but also deals with further aspects of sustainability and proper conduct of business operations.",VERBUND,VERBUND-Integrated-Annual-Report-2019-Englisch.pdf,[9],0.0,2019,VERBUND,TEXT,"[""This integrated annual report contains the Group management report published by VERBUND for financial +year 2019, the Group report on non-financial information (NFI Report) and the Group's consolidated +financial statements, including the notes to the consolidated financial statements. The principles of fair +enterprise management followed by VERBUND are laid out in the Corporate Governance Report. This +integrated annual report thus not only presents the Group's financial and legal information but also deals +with further aspects of sustainability and proper conduct of business operations.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +241,What is the company name?,"This report contains certain forward-looking statements that involve risks and uncertainties. In some cases, we use words such as aim, ambition, continue, expect, may, strategy, will, in line with, and similar expressions to identify forward-looking statements. 
Forward-looking statements include all statements other than statements of historical fact, including, among others, statements regarding Equinor’s ambitions, plans, intentions, aims and expectations with respect to Equinor’s new climate roadmap, including with respect to its net carbon intensity, carbon efficiency, methane emissions and flaring reductions, renewable energy capacity, carbon-neutral global operations, internal carbon price on investment decisions, future levels of, and expected value creation from, oil and gas production, scale and composition of the oil and gas portfolio, development of CCUS and hydrogen businesses, use of offset mechanisms and natural sinks and support of TCFD recommendations.",Apache,2017_SustainabilityReport_2_9_Web.pdf,[5],0.0,2017,Apache,TEXT,"[""Welcome to Apache's 2017 sustainability report. +To view the report online, please visit the Apache +website at www.apachecorp.com/sustainability""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +242,What is the company name?,This report contains forward-looking statements regarding the future development of the RWE Group and its companies as well as future economic and political developments,RWE,RWE-csr_overall-report-2019.pdf,[27],0.0,2019,RWE Group,TEXT,"[""This report contains forward-looking statements regarding the future development of the RWE Group and its companies as well as future economic and political developments""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +243,What is the company name?,"This report covers the operations of the OMV Group, headquartered in Vienna, Austria, for the 2018 business year.",OMV,dload_Sustainability Report 2018_en.pdf,[2],0.0,2018,OMV Group,TEXT,"[""This report covers the operations of the OMV Group, headquartered in Vienna, Austria, for the 2018 business year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +244,What is the company name?,"This year Equinor also signed contracts for the 
Hywind Tampen wind farm development. This project will contribute to further developing floating offshore wind technology and reducing the costs of future floating offshore wind farms, offering new industrial opportunities for Norway, the licenses and the Norwegian supplier industry in a growing global offshore wind market.",Approach Resources Inc,NASDAQ_AREX_2015 annual.pdf,[9],0.0,2015,Approach Resources Inc.,TEXT,"[""Approach Resources Inc. is an independent energy company focused on the exploration, development, +production and acquisition of unconventional oil and gas reserves in the Midland Basin of the greater Permian +Basin in West Texas, where we lease approximately 126,000 net acres as of December 31, 2015. We believe our +concentrated acreage position provides us an opportunity to achieve cost, operating and recovery efficiencies in +the development of our drilling inventory. Our long-term business strategy is to develop resource potential from +the Wolfcamp shale oil formation. See """"” Our Business Strategy"" below. Additional drilling targets could +include the Clearfork, Canyon Sands, Strawn and Ellenburger zones. We sometimes refer to our development +project in the Permian Basin as ""Project Pangea,"" which includes ""Pangea West."" Our management and technical +team have a proven track record of finding and developing reserves through advanced drilling and completion +techniques. As the operator of all of our estimated proved reserves and production, we have a high degree of +control over capital expenditures and other operating matters.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +245,What is the company name?,Through human rights supplier verifications we identified gaps both with regards to management system and implementation. We pay particular attention to findings that are considered potential markers of modern-day slavery and collaborate with the suppliers to improve and close the gaps. 
,Devon,NYSE_DVN_2018.pdf,[6],0.0,2018,Devon,TEXT,"[""A Delaware corporation formed in 1971 and publicly held since 1988, Devon (NYSE: DVN) is an +independent energy company engaged primarily in the exploration, development and production of oil, natural gas +and NGLs. Our operations are concentrated in various North American onshore areas in the U.S. and Canada. In +July 2018, we exited the midstream business by divesting our aggregate ownership interests in EnLink and the +General Partner.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +246,What is the company name?,"Today, the oil and gas industry is transforming at a pace not seen in recent history, and DCP Midstream is proud to be leading the way through our talented people, optimized processes, and innovative technologies. As we look beyond the horizon, our strategic approach to ensuring long-term stakeholder value can be narrowed to two core areas of focus: operational excellence and sustainability.",DCP Midstream,DCP-Sustainability-ReportQ120.pdf,[3],0.0,2019,DCP Midstream,TEXT,"[""Today, the oil and gas industry is +transforming at a pace not seen in +recent history, and DCP Midstream is +proud to be leading the way through our +talented people, optimized processes, +and innovative technologies. As we +look beyond the horizon, our strategic +approach to ensuring long-term +stakeholder value can be narrowed to +two core areas of focus: operational +excellence and sustainability.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +247,What is the company name?,"Together with partners we sanctioned and submitted the Plan of Development for Hywind Tampen to the authorities. This is a project that uses floating wind turbines to generate renewable electricity to supply two oil and gas fields in the Tampen area: Snorre and Gullfaks. Once completed, around 35% of the annual power demand from the five platforms in the area will be met by a floating offshore wind farm. 
Emissions from the Gullfaks and Snorre fields will be reduced by more than 200,000 tonnes per year. ",Approach Resources Inc,NASDAQ_AREX_2018 annual.pdf,[7],0.0,2018,Approach Resources Inc.,TEXT,"[""Approach Resources Inc. is an independent energy company focused on the exploration, development, +production and acquisition of unconventional oil and gas reserves in the Midland Basin of the greater Permian Basin +in West Texas, where we lease approximately 150,000 net acres as of December 31, 2018. We believe our +concentrated acreage position and extensive, integrated field infrastructure system provide us an opportunity to +achieve cost, operating and recovery efficiencies in the development of our drilling inventory. Our long-term +business strategy is to develop resource potential from the Wolfcamp shale oil formation and pursue acquisitions +that meet our strategic and financial objectives. See """"” Our Business Strategy"" below. Additional drilling targets +could include the Clearfork, Canyon Sands, Strawn and Ellenburger zones. We sometimes refer to our development +project in the Permian Basin as ""Project Pangea,"" which includes ""Pangea West."" Our management and technical +team have a proven track record of finding and developing reserves through advanced drilling and completion +techniques. As the operator of all of our estimated proved reserves and production, we have a high degree of control +over capital expenditures and other operating matters.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +248,What is the company name?,"Total scope one emissions of CO₂ (kg CO₂) from exploration and production, divided by total production (boe).",NTPC Limited,NTPC Limited-Report-FY-19.pdf,[6],0.0,2019,"NTPC +Limited",TEXT,"[""The sustainability report of NTPC +Limited is in accordance with Global +Reporting Initiative (GRI) Standards +""Comprehensive"" option and +incorporates the IIRC framework for +the period April 1, 2018 to March +31, 2019. 
NTPC has defined its +capitals and attempted to provide an +overview of how it creates value for its +stakeholders for FY19. The last +sustainability report FY18 was +released on February 13, 2019. All +reports are available on the +company's website http:// ntpc.co. +in/en/sustainability /reportsand- +policies. NTPC follows +financial year reporting period for +Sustainability Report.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +249,What is the company name?,Transocean Sustainability Report 2017/2018,Transocean Ltd,Transocean_Sustain_digital_FN_4 2017_2018.pdf,[1],0.0,2017/2018,Transocean,TEXT,"[""Transocean Sustainability Report 2017/2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +250,What is the company name?,"UK The Equinor operated offshore wind farms Sheringham Shoal, Dudgeon and Hywind Scotland are supporting local communities through community funds or local educational initiatives and sponsorships.",AGL Energy Ltd,AGL Energy Ltd FY19 Carbon Scenario Analysis.pdf,[1],0.0,2019,AGL,TEXT,"[""agl""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +251,What is the company name?,"Unintentional spills of chemicals, produced water, ballast water and polluted water reaching the natural environment.",Chesapeake energy,Chesapeake 2017 Annual Report.pdf,[1],0.0,2017,Chesapeake energy,TEXT,"[""Chesapeake energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +252,What is the company name?,"Urgent need for action Climate change is one of the main challenges of our time and a clear call for action. Equinor acknowledges the findings of the Intergovernmental Panel on Climate Change (IPCC) that human activities contribute to global warming with detrimental effects on nature, people and society at large. 
We recognise that the world's energy systems must be transformed in a profound way to drive decarbonisation, while at the same time ensuring universal access to affordable and clean energy and realising the United Nations Sustainable Development Goals. We want to be an active player in this change by reducing emissions, growing in renewable energy and providing low carbon solutions to our customers to help accelerate decarbonisation. According to IPCC’s 1.5 C report from 2018 and the two IPCC special reports from 2019 on land and on the ocean and cryosphere in a changing climate, global temperature rise has already reached 1C above the pre-industrial level. Global warming is damaging the ability of the land and the ocean to sustain humanity. To avoid an irreversible climate crisis, global warming needs to be kept to well below 2C and urgent actions are needed to reduce greenhouse gas emissions from all sectors.",OMV,Sustainability Report 2015_EN.pdf,[2],0.0,2015,OMV Group,TEXT,"[""About this report This report covers the sustainability operations of OMV Group, headquartered in Vienna, Austria, for the 2015 business year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +253,What is the company name?,"VIETNAM ELECTRICITY 11 Cua Bac street, Ba Dinh district, Hanoi, Vietnam Website: http://www.evn.com.vn Telephone: 024.66946789 | Fax: 024.66946666",EVN,Vietnam Electricity Corporation (EVN)_AnnualReport2018(1).pdf,[46],0.0,2018,Vietnam Electricity,TEXT,"[""VIETNAM ELECTRICITY 11 Cua Bac street, Ba Dinh district, Hanoi, Vietnam Website: http://www.evn.com.vn Telephone: 024.66946789 | Fax: 024.66946666""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +254,What is the company name?,We aim to increase our equity renewable capacity ten-fold from 2019 to 2026.,Aker BP,Aker-BP-Sustainability-report-2017.pdf,[1],0.0,2017,Aker BP,TEXT,"[""AKER BP ASA""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +255,What is the company 
name?,"We believe that our strategy and long-term perspective on value creation will make us more competitive in the long term. Our values open, collaborative, courageous and caring help us set direction and guide our decisions, actions, and the way we interact with others. ",Transneft PJSC,annual 2018.pdf,[1],0.0,2018,Transneft,TEXT,"[""TRANSNEFT""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +256,What is the company name?,We create shared value that contributes to sustainable development through:,Cabot Oil & Gas Corp,Cabot Oil & Gas Corp Annual Report 2016.pdf,[1],0.0,2016,CABOT OIL & GAS CORPORATION,TEXT,"[""CABOT OIL & GAS CORPORATION""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +257,What is the company name?,"We follow rigorous technical and operational standards for well design and operations, including standards for the types and volumes of chemicals used in drilling and hydraulic fracturing fluids. We disclose the chemicals used in hydraulic fracturing through FracFocus1.",OMV,Sustainability Report 2017_EN.pdf,[2],0.0,2017,OMV Group,TEXT,"[""About this report This report covers the operations of OMV Group, headquartered in Vienna, Austria, for the 2017 business year.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +258,What is the company name?,"We recognise that our efforts in this space is a continuous journey of improvement. 
As such, the human rights improvement project conducted an analysis during 2019 to explore how we can ensure ongoing improvement of identification and engagement with potentially affected stakeholders, paying attention to our activities in, amongst others, Argentina, Nicaragua and Mexico.",Cenovus Energy,Cenovus Annual Report 2014.pdf,[1],0.0,2014,Cenovus Energy,TEXT,"[""cenovus ENERGY""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +259,What is the company name?,"We see from post-course feedback that attendees consider these training sessions to increase specific awareness of human rights issues related to their work, leading to changed behaviours when assessing risks, following up on issues, and ensuring that human rights is included when scoping work. ",DCP Midstream,DCP-Sustainability-ReportQ120.pdf,[3],0.0,2019,DCP Midstream,TEXT,"[""Today, the oil and gas industry is +transforming at a pace not seen in +recent history, and DCP Midstream is +proud to be leading the way through our +talented people, optimized processes, +and innovative technologies. As we +look beyond the horizon, our strategic +approach to ensuring long-term +stakeholder value can be narrowed to +two core areas of focus: operational +excellence and sustainability.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +260,What is the company name?,"Welcome to Apache's 2017 sustainability report. To view the report online, please visit the Apache website at www.apachecorp.com/sustainability",Apache,2017_SustainabilityReport_2_9_Web.pdf,[5],0.0,2017,Apache,TEXT,"[""Welcome to Apache's 2017 sustainability report. 
+To view the report online, please visit the Apache +website at www.apachecorp.com/sustainability""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +261,What is the company name?,Welcome to OMV's 2018 Sustainability Report,OMV,dload_Sustainability Report 2018_en.pdf,[2],0.0,2018,OMV,TEXT,"[""Welcome to OMV's 2018 Sustainability Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +262,What is the company name?,Welcome to the University of Plymouth's fifth Sustainability Report,University of Portsmouth,University of Plymouth Sustainability_Report_2018.pdf,[3],0.0,2018,University of Plymouth,TEXT,"[""Welcome to the University of Plymouth's fifth Sustainability Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +263,What is the company name?,"While the Chinese power industry is facing imminent challenges, opportunities also arise. In 2018, CR Power actively responded to changes caused by power reform and industrial transformation, accelerated the development of renewable energy, disposed of inefficient assets, and actively promoted business innovation and transformation.",CR Power,China Resources Power Holdings Co Ltd Annual Report 2018.pdf,[13],0.0,2018,CR Power,TEXT,"[""While the Chinese power industry is facing imminent challenges, +opportunities also arise. 
In 2018, CR Power actively responded to +changes caused by power reform and industrial transformation, +accelerated the development of renewable energy, disposed of +inefficient assets, and actively promoted business innovation and +transformation.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +264,What is the company name?,"Xcel Energy achieved its earnings target once again in 2019, marking the 15th consecutive year of meeting or exceeding our earnings guidance.",XCEL,Xcel_Energy-AR2019.pdf,[2],0.0,2019,Xcel Energy,TEXT,"[""Xcel Energy achieved its earnings target once again in 2019, marking the 15th consecutive year of meeting or exceeding our earnings guidance.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +265,What is the company name?,Xcel Energy is a major U.S. electric and natural gas company with annual revenues of $11.5 billion.,XCEL,Xcel_Energy-AR2019.pdf,[3],0.0,2019,Xcel Energy,TEXT,"[""Xcel Energy is a major U.S. electric and natural gas company with annual revenues of $11.5 billion.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +266,What is the company name?,"Xcel Energy is a major U.S. regulated electric and natural gas delivery company headquartered in Minneapolis, Minnesota (incorporated in Minnesota in 1909).",XCEL,Xcel_Energy-AR2019.pdf,[22],0.0,2019,Xcel Energy,TEXT,"[""Xcel Energy is a major U.S. regulated electric and natural gas delivery company headquartered in Minneapolis, Minnesota (incorporated in Minnesota in 1909).""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +267,What is the company name?,agl,AGL Energy Ltd,AGL Energy Ltd Annual Report 2019.pdf,[1],0.0,2019,AGL,TEXT,"[""agl""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +268,What is the company name?,"but we must strive to be always safe and will increase our efforts going forward. In particular, the follow up of compliance with Life-Saving Rules will be strengthened. 
",Enel,Enel SA sustainability-report-2017.pdf,[5],0.0,2017,Enel,TEXT,"[""In defining and implementing its strategic vision, Enel carefully integrates and combines all relevant factors: economic-financial, environmental, social and governance-related.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +269,What is the company name?,cenovus ENERGY,Cenovus Energy,Cenovus Annual Report 2019.pdf,[1],0.0,2019,Cenovus Energy,TEXT,"[""cenovus ENERGY""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +270,What is the company name?,cenovus energy 2012 annual report,Cenovus Energy,Cenovus Annual Report 2012.pdf,[1],0.0,2012,cenovus ENERGY,TEXT,"[""cenovus energy 2012 annual report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +271,What is the company name?,climate-related risks and opportunities in line with its strategy and risk management process. ,NOVATEK,04_NOVATEK_AR_2018_ENG_15.pdf,[1],0.0,2018,PAO NOVATEK,TEXT,"[""PAO NOVATEK ANNUAL REPORT 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +272,What is the company name?,"environments, Resource management (waste and water), Biodiversity and sensitive areas",Cenovus Energy,Cenovus Sustainability Report 2017.pdf,[1],0.0,2017,Cenovus Energy,TEXT,"[""cenovus ENERGY""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +273,What is the company name?,"for polar bears, density modelling of whales and dolphins, distribution modelling of bird species and studies to increase our general knowledge on ice edge ecosystems. Offshore wind – UK and USA Equinor’s Empire Wind offshore wind project, currently under development, has engaged in a pioneering partnership with conservation scientists to protect the endangered North Atlantic right whale. The collaboration with the Wildlife Conservation Society has deployed two high-tech whale monitoring equipment in the lease area. 
The real-time monitoring tool will be an effective way to detect large whale species during construction activities and will also provide scientists with significantly more spatial and temporal distribution data, which will be helpful to identify the best way to protect the species.",Approach Resources Inc,NASDAQ_AREX_2016 annual.pdf,[8],0.0,2016,Approach Resources Inc.,TEXT,"[""Approach Resources Inc. is an independent energy company focused on the exploration, development, +production and acquisition of unconventional oil and gas reserves in the Midland Basin of the greater Permian Basin +in West Texas, where we lease approximately 123,000 net acres as of December 31, 2016. We believe our +concentrated acreage position and extensive, integrated field infrastructure system provides us an opportunity to +achieve cost, operating and recovery efficiencies in the development of our drilling inventory. Our long-term +business strategy is to develop resource potential from the Wolfcamp shale oil formation and pursue acquisitions +that meet our strategic and financial objectives. See """"” Our Business Strategy"" below. Additional drilling targets +could include the Clearfork, Canyon Sands, Strawn and Ellenburger zones. We sometimes refer to our development +project in the Permian Basin as ""Project Pangea,"" which includes ""Pangea West."" Our management and technical +team have a proven track record of finding and developing reserves through advanced drilling and completion +techniques. 
As the operator of all of our estimated proved reserves and production, we have a high degree of control +over capital expenditures and other operating matters.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +274,What is the company name?,including a review of the consistency of information against the GRI index.,Cabot Oil & Gas Corp,Cabot Oil & Gas Corp Annual Report 2017.pdf,[1],0.0,2017,CABOT OIL & GAS CORPORATION,TEXT,"[""CABOT OIL & GAS CORPORATION +2017 Annual Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +275,What is the company name?,interaction between the protected areas and these assets. ,AES Corporation ,AES Corporation Annual Report 2018.pdf,[1],0.0,2018,THE AES CORPORATION,TEXT,"[""THE AES CORPORATION""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +276,What is the company name?,local job creation and local sourcing of goods and services,RWE,RWE-csr_overall-report-2019.pdf,[36],0.0,2019,RWE Aktiengesellschaft,TEXT,"[""RWE Aktiengesellschaft""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +277,What is the company name?,"nmVOC released to the atmosphere from power generation and heat production, flaring (including well testing/well work-over), process, cold venting and fugitives.",Eni SpA,EniFor-2018-eng.pdf,[6],0.0,2018,Eni,TEXT,"[""ENI IN THE WORLD""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +278,What is the company name?,"opportunity areas are: Competitive at all times, Transforming the oil and gas industry, and Providing energy for a low carbon future. ",PGE,PGE_Mngmnt_Board_consolidated_report_PGE_CG_2018_with comments.pdf,[7],0.0,2018,PGE Group,TEXT,"[""PGE Group as of the end of 2018 consisted of: ï‚¡ PGE S.A. - the parent company, ï‚¡ 57 subsidiaries subject to consolidation, ï‚¡ 4 associates, ï‚¡ 1 jointly controlled entity.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +279,What is the company name?,"over many years. 
Our workforce is also exposed to risk factors such as noise and chemicals, these areas are followed up in our daily work and through continuous improvement efforts. ",BASF SE,BASF_Report_2016.pdf,[1],0.0,2016,BASF,TEXT,"[""BASF Report 2016""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +280,What is the company name?,"saipem SpA Via Martiri di Cefalonia, 67 20097 San Donato Milanese Milan - Italy",Saipem SpA,SaipemSustainability2018.pdf,[72],0.0,2018,saipem SpA,TEXT,"[""saipem SpA +Via Martiri di Cefalonia, 67 +20097 San Donato Milanese +Milan - Italy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +281,What is the company name?,scale-up of investment in sustainable natural carbon sinks. ,Tatneft,PJSC Tatneft annual report 2016.pdf,[4],0.0,2016,TAFTNEFT,TEXT,"[""The PJSC TATNEFT's securities are listed in the Russian and international stock markets. +The Company's ordinary and preferred shares are traded on the Moscow Stock Exchange +and are quoted on the highest list of the first (I) level. 28.5% of the voting shares were +deposited to be converted to global American Depository Receipts (ADR). The Company's +depositary receipts are included in the listing of the London Stock Exchange (ATAD).""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +282,What is the company name?,"sea is closely monitored to ensure it stays within regulatory limits. In some cases, especially during periods of varying process conditions, produced water is dispatched together with crude oil through pipelines to onshore plants for treatment. 
Improved work processes and an IT tool for water management have been implemented.",Adani,Adani Group Adani Enterprises Annual Report 2019.pdf,[1],0.0,2018-19,Adani Enterprises Limited,TEXT,"[""Adani Enterprises Limited""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +283,What is the company name?,"to discuss concerns with their leader or the leader’s superior or use available internal channels to provide support. Concerns may also be reported through our Ethics Helpline. The helpline allows for anonymous reporting and is open to employees, business partners and the general public. Equinor has a strict non-retaliation policy.",CenterPoint Energy,CenterPoint Energy Annual report 2012.pdf,[1],0.0,2012,CenterPoint Energy,TEXT,"[""CenterPoint Energy""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +284,What is the company name?,tonnes of gas flared per1000 tonnes of hydro- carbon produced,Teekay Corp,Teekay-Corporation-2018-Sustainability-Report.pdf,[1],0.0,2018,TEEKAY CORPORATION,TEXT,"[""TEEKAY CORPORATION +2018 Sustainability Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +285,What is the company name?,"us. Equinor has low carbon as one of the main strategic pillars on which the governance of the company is based, and we embed climate considerations into decision making, sensitivity testing, incentives and reporting. ",ROMGAZ,Annual Report 2016_0.pdf,[1],0.0,2016,"Societatea Nationala de Gaze Naturale ""ROMGAZ"" SA ",TEXT,"[""Societatea Nationala de Gaze Naturale ""ROMGAZ"" SA Board of Director's Report 2016""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +286,What is the company name?,value creation and portfolio optimisation through valuable partnerships. ,XCEL,Xcel_Energy-AR2019.pdf,[3],0.0,2019,Xcel Energy,TEXT,"[""Xcel Energy is a major U.S. 
electric and natural gas company with annual revenues of $11.5 billion.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +287,What is the company name?,"were within or near the terminal area. The free oil at and around the terminal has been collected. Clean-up continues in forest areas north-east of the terminal, closely monitored by environmental experts. There have been no confirmed observations of oil on sea water coming from the oil spill. Tests of groundwater from monitoring wells on site in November 2019 show no contamination from the oil spill. Groundwater sampling events will be completed on a quarterly basis throughout 2020.",NOVATEK,04_NOVATEK_AR_2016_ENG_11.pdf,[3],0.0,2016,NOVATEK,TEXT,"[""About the Company NOVATEK is one of the largest independent natural gas producers in Russia""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +288,What is the company name?,wintershall dea,Wintershall Dea,Wintershall Dea annual report 2019.pdf,[1],0.0,2019,Wintershall Dea,TEXT,"[""wintershall dea""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,1 +289,What is the company name?,• AR 3.10 – Risk management and internal control • SR – Embedding sustainability in how we work • SR – Climate-related business risks and portfolio resilience ,Gazprom PJSC,gazprom-annual-report-2018-en.pdf,[1],0.0,2018,PJSC GAZPROM,TEXT,"[""PJSC Gazprom Annual Report 2018""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +290,What is the company name?,"• Capture value from cycles: We have demonstrated in the past the ability to create value through the cycles, by adding resources in downturns and optimising the portfolio in upturns. ",PGE,PGE-Presentation_Q42018_EN.pdf,[52],0.0,2019,PGE,TEXT,"[""This presentation has been prepared by the management of PGE Polska Grupa Energetyczna S.A. 
(the ""Company"" or ""PGE"") and other entities.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +291,What is the company name?,"• Cost competitiveness: We seized the opportunity that arose from the previous downturn to make lasting improvements, and we aim to keep cost levels under control when the prices are increasing. ",Saipem SpA,Annual-report-2019.pdf,[2],0.0,2019,SAIPEM SpA,TEXT,"[""BOARD OF DIRECTORS AND statutory AUDITORS OF SAIPEM SpA""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +292,What is the company name?,"• Providing access to affordable, reliable, sustainable and modern energy • Creating value for shareholders • • Hiring and developing staff, and promotion of diversity and inclusion in our workforce • Creating opportunities for social and economic development across our value chain through payments to governments, ",CenterPoint Energy,CenterPoint Energy Annual report 2016.pdf,[1],0.0,2016,CenterPoint Energy,TEXT,"[""CenterPoint Energy 2016 Annual Report""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +293,What is the company name?, Confirming agreement of the CO2 reporting for Norway with the preliminary EUETS reporting,Approach Resources Inc,NASDAQ_AREX_2017 annual.pdf,[9],0.0,2017,Approach Resources Inc.,TEXT,"[""Approach Resources Inc. is an independent energy company focused on the exploration, development, +production and acquisition of unconventional oil and gas reserves in the Midland Basin of the greater Permian Basin +in West Texas, where we lease approximately 149,000 net acres as of December 31, 2017. We believe our +concentrated acreage position and extensive, integrated field infrastructure system provides us an opportunity to +achieve cost, operating and recovery efficiencies in the development of our drilling inventory. 
Our long-term +business strategy is to develop resource potential from the Wolfcamp shale oil formation and pursue acquisitions +that meet our strategic and financial objectives. See “— Our Business Strategy” below. Additional drilling targets +could include the Clearfork, Canyon Sands, Strawn and Ellenburger zones. We sometimes refer to our development +project in the Permian Basin as “Project Pangea,” which includes “Pangea West.” Our management and technical +team have a proven track record of finding and developing reserves through advanced drilling and completion +techniques. As the operator of all of our estimated proved reserves and production, we have a high degree of control +over capital expenditures and other operating matters.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 +294,What is the company name?, One physical site visits and in-depth interviews with three Equinor locations in order to gather and review,Canadian Natural Resources Ltd,Canadian Natural Resources Annual Report 2018.pdf,[2],0.0,2018,Canadian Natural,TEXT,"[""Canadian Natural 2018 Annual Report Premium Value. Defined Growth. Independent.""]",20201030 1Qbit aggregated_annotations_needs_correction.xlsx,0 diff --git a/data/extraction/sustainability-report-2019.json b/data/extraction/sustainability-report-2019.json new file mode 100644 index 0000000..c76b847 --- /dev/null +++ b/data/extraction/sustainability-report-2019.json @@ -0,0 +1 @@ +{"1": ["to invest in the protection of tropical forests and develop a ", "mechanism to tap into the important and effective abilities of ", "natural sinks to absorb CO\u2082 from the atmosphere. ", "The global energy transition creates new business ", "opportunities. Decades of offshore experience and innovative ", "solutions enable Equinor to capture those opportunities in the ", "offshore wind area. Last year, Equinor prepared the ground for ", "substantially scaling up investments in offshore wind. 
Together ", "with our partner SSE, we were awarded contracts to build the ", "world\u2019s largest offshore wind farm in the Dogger Bank area ", "of the North Sea. Equinor was also awarded the contract to ", "Equinor supports the Paris agreement and a net zero target ", "develop the Empire Wind farm offshore New York in the Atlantic ", "for society. We have already brought CO\u2082 emissions in the oil ", "Ocean. Meanwhile, the pioneering Hywind Tampen project, ", "and gas production process down to industry leading levels, ", "providing electricity to five offshore platforms at the Gullfaks ", "and we will continue to do more. Our journey to develop as a ", "and Snorre fields on the NCS, passed an important milestone as ", "broad energy company is founded on a strong commitment to ", "Equinor and partners reached a final investment decision and ", "sustainability, and our strategy \u2013 always safe, high value and ", "awarded five major contracts. Equinor is positioning itself to be ", "low carbon \u2013 is applied in everything we do. ", "The safety and security of our people, and integrity of our ", "Equinor is a values-based company. How we deliver is equally ", "operations, is our top priority. I am pleased to see improvement ", "important as what we deliver. We recognise that we can only ", "in important areas, although we will need to work even harder ", "retain our social license to operate by conducting responsible ", "to avoid major accidents, intensify efforts related to near-", "operations. This starts with managing our environmental ", "misses and further reduce personnel injuries.", "impact, including on oceans. As a founding patron of the UNGC ", "We acknowledge climate science and have embedded climate ", "urgency and global importance of healthy oceans. Increasing ", "considerations into our business strategy and decision-making ", "awareness and corresponding action towards preserving ", "process. 
In 2019, Equinor, together with investors participating ", "ocean environments is one of the company\u2019s sustainability ", "for Sustainable Ocean Principles, Equinor addresses the ", "in Climate Action 100+, announced new steps to further ", "demonstrate industry leadership and support for the goals ", "of the Paris Agreement. We have launched a new climate ", "How we treat and protect people is essential for responsible ", "roadmap and set ambitions beyond 2030, performed a tougher sensitivity test of our portfolio, and disclosed climate-related ", "operations. Equinor already has human rights principles ", "embedded in both our corporate values and the Code ", "risks in line with the TCFD recommendations. ", "of Conduct, but we strive to continuously improve and ", "systematically further integrate human rights into the way we ", "2019 marked the start-up of Johan Sverdrup \u2013 the largest ", "conduct business. Our commitment is to make our best efforts, ", "development on the Norwegian continental shelf since the ", "so that human rights are respected across the entire Equinor, ", "1980s \u2013 ahead of schedule and well below the original cost ", "including our employees, the people affected by our operations ", "estimates. Johan Sverdrup is a frontrunner in the fit-for-future ", "and partnerships, as well as throughout our supply chains.", "portfolio Equinor is building, to create long-term sustainable ", "value for our society. The field has a record low carbon intensity, ", "For almost 50 years, Equinor has dedicated itself to our ", "purpose of turning natural resources into energy for people ", "Our efforts do not stop at curtailing our own emissions. We take ", "and guided by the United Nation\u2019s Sustainable Development ", "an active role in helping society to accelerate decarbonisation ", "Goals, and we are committed to long-term sustainable value ", "and progress for society. 
Our actions will continue to be inspired ", "through close collaboration with industry players, customers, ", "and governments. Examples include hydrogen developments ", "and the Northern Lights project, which aims at developing a ", "President and Chief Executive Officer ", "carbon capture and storage value chain. We are prepared ", "Low carbon - Creating a low-carbon advantage", "Always safe - Responsible operations Protecting people", "Promoting integrity and transparency", "Appendices Definitions and abbreviations", "Task Force on Climate-related Financial Disclosures (TCFD) reference index", "Equinor is partnering with SSE Renewables to deliver ", "Our record-breaking Johan Sverdrup field came on ", "Dogger Bank \u2013 the world\u2019s largest offshore wind farm and ", "stream in October 2019 and is already producing ", "an important milestone in the UK\u2019s transition to renewable ", "more than 350,000 barrels per day. It is powered ", "energy. Once complete, Dogger Bank is expected to ", "produce enough power for 4.5 million British homes.", "by electricity from shore, making it one of the most ", "Equinor Sustainability report 2019Introduction"], "2": ["We are Equinor, an international energy company with a proud history. With more than 21,000 committed colleagues developing oil, gas, wind and solar energy, we are present in more than 30 countries worldwide. We are the largest operator in Norway, among the world\u2019s largest offshore operators, and a growing force in renewables. ", "Reporting standards This report has been prepared in accordance with the Global Reporting Initiative (GRI) Standards: Core option. A GRI Index is available at equinor.com. The sustainability report should be read in conjunction with the GRI index. We view this report to be our Communication on Progress to the UN Global Compact (advanced reporting level). 
", "We also use reporting guidance from IPIECA, the global oil and gas industry association for environmental and social issues, and recommendations from the Task Force on Climate-related Financial Disclosures. ", "Assurance This report has been externally assured by EY, with reasonable level of assurance for selected climate, environment and safety indicators, and a limited level of assurance for the rest of the report, excluding forward looking information. The independent assurance statement, as listed in appendix, concludes that the report is presented in all material respects, in accordance with the GRI Standards: Core option. ", "Reporting boundaries Defining consistent boundaries for sustainability reporting is challenging due to the complexity of ownership and operational arrangements, such as joint operating agreements. We strive to be consistent and transparent about variations in boundaries and provide a complete report in line with industry practice.", "\u2022 Environmental data is, unless otherwise stated, reported on a 100% basis for our operated assets, facilities and vessels, including subsidiaries and operations where we are the technical service provider, and for contracted drilling rigs and flotels (operational control basis). ", "\u2022 Scope 1 CO\u2082 emissions are reported both on an operational control basis and on equity basis (financial ", "\u2022 Scope 3 greenhouse gas emissions are reported on the basis of equity (volumes of products sold). \u2022 Health and safety incident data is reported for our operated assets, facilities and vessels, including subsidiaries and operations where we are the technical service provider. These include contracted drilling rigs, floatels, vessels, projects and modifications, and transportation of personnel and products, using a risk-based approach.", "\u2022 Economic data is reported on an equity basis, unless otherwise stated. \u2022 Workforce data covers employees in our direct employment. 
Temporary employees are not included. \u2022 Human rights and social performance data are collected from assets under our operational control.", "Assets acquired or disposed of during the year are included for the period in which we owned them, unless otherwise stated. Entities that we do not control, but have significant influence over, are included in the form of disclosures of management approach. The report does not include data from equity interest fields/projects, such as joint ventures, where we are not operator. Exceptions are for climate data or where specified. ", "Restatements Historic numbers are sometimes adjusted due to for example changes in reporting principles, changes of calculation factors used by authorities, or re-classification of incidents after investigations. We restate historic numbers and explain the changes if the adjustment represents a change of minimum 5% for indicators with reasonable level of assurance, and 10% for indicators with limited level of assurance. ", "Per day oil and gas equity production", "Renewable energy equity production", "2019 Serious incident frequency (SIF - per million hours worked)", "2019 CO2 intensity for the upstream oil and gas portfolio (operated 100%, kg CO\u2082/boe)", "We energize the lives of 170 million people. Every day."], "3": ["Material topics and stakeholder dialogue", "This report focuses on the sustainability topics that were most significant to us and our stakeholders in 2019. ", "The material topics have been selected and prioritised through a systematic process based on the reporting principles in the GRI Standards. Our material topics are defined as those that have or may have a significant impact on our stakeholders and on Equinor. ", "Stakeholder dialogue is an important part of the content selection process. We conduct our business in continuous engagement with our key stakeholders throughout the year. 
Stakeholder dialogue is undertaken by amongst others the chairman of the board, the CEO and other senior managers. Key stakeholder groups include employees, shareholders, governments, business partners and suppliers, customers, and society at large, including non- governmental organisations and academia. An overview of our key stakeholder groups and prioritised issues is available at Equinor.com. Regular dialogue, media analysis, investor roadshows and other stakeholder outreach with ", "key stakeholders on sustainability topics, have helped capture the stakeholder views and concerns most relevant for this report.", "Throughout the year, we have also engaged in dialogue with the investor group Climate Action 100+, and in April 2019 we published a joint statement with this group. The commitments are further addressed in the report and the statement is available at Equinor.com.", "When assessing the impact on stakeholders, we considered the global sustainability context, transparency and relevant reporting standards. ", "To assess the importance of various sustainability topics to Equinor, we reviewed our business strategy, sustainability priorities and business risks. We engaged our business areas to capture views from different parts of the business. ", "Our material topics have remained, to a large extent, consistent over the last three years. 
", "Climate change and the energy transition: Business strategy, GHG emissions, New energy solutions, Low carbon research and development ", "Creating shared value: Economic and social impact, Local procurement, Employment, People development, Innovation and research and development activities", "Responsible operations: \u2022 Safety and security: Personnel safety, Emergency ", "preparedness, Health and working environment, Security and cyber security", "\u2022 Environmental impact: Emissions and discharges to local ", "environments, Resource management (waste and water), Biodiversity and sensitive areas", "\u2022 Ethics and anti-corruption: Revenue and tax transparency, ", "\u2022 Human rights: Labour rights and working conditions ", "(employees and supply chain), Diversity and inclusion, Human rights in communities and security arrangements. ", "Other reports The following Equinor reports provide additional information about our business activities and impacts: \u2022 Annual report and Form 20-F, including Payments to ", "Sustainability performance data Performance data in this report and supplementary data are presented online at sustainability.equinor.com.", "governments report \u2022 CDP 2019 response \u2022 Global Reporting Initiative (GRI) index 2019 \u2022 Energy Perspectives 2019", "Feedback We welcome your feedback. Please use the e-mail and social media channels linked below for comments and questions. ", "Equinor.com For further information about sustainability at Equinor, visit our web pages and follow us on social media."], "4": ["The world needs energy providers that can deliver energy with lower emissions", "Our purpose To turn natural resources into energy for people and progress for society. 
", "Low carbon Creating a low-carbon business advantage Industry leader in carbon efficiency ", "Our sustainability priority areas reflect our main contributions to, and impact on society and entail significant business risks and opportunities.", "Always safe Responsible operations Safety is our first priority ", "Respect human rights and promote integrity", "Sustainability is embedded in Equinor's: ", "Equinor\u2019s purpose is to turn natural resources into energy for people and progress for society. Our strategy \u2013 always safe, high value and low carbon \u2013 positions us to deliver long-term value in a low carbon future. This is reflected in our vision: Shaping the future of energy. We are developing from an oil and gas company to a broader energy company. Our three sustainability priorities \u2013 responsible operations, creating a low-carbon business advantage, and creating shared value \u2013 are embedded in our strategy. ", "Always safe: Safe and responsible operations are essential for our license to operate and an enabler of long-term value creation. We have set clear targets for continuous improvement of our safety records. Responsible operations include managing our environmental impact, respecting human rights and promoting integrity and transparency. ", "High value: We deliver energy to millions of people and create value for our shareholders. Through our core business and supply chain, we create economic value and opportunities for society and communities. We provide jobs and develop capabilities among our own employees and beyond our company. ", "Low carbon: To thrive in the energy transition, we aim to maintain our position as one of the industry leaders in carbon efficient oil and gas production, grow in new energy solutions and step up helping accelerating decarbonization of society. ", "We believe that our strategy and long-term perspective on value creation will make us more competitive in the long term. 
Our values open, collaborative, courageous and caring help us set direction and guide our decisions, actions, and the way we interact with others. ", "Our contribution to the UN Sustainable Development Goals Equinor supports the UN Sustainable Development Goals (SDGs) and shares the view that business has a key role to play in the implementation of the goals. Our main contribution to society is the energy we deliver, the economic value and jobs we create, the people we develop, our efforts to reduce greenhouse gas emissions, and pursuing safe and responsible operations. ", "We recognise that our business activities may have both positive and negative impacts on the SDGs. Our impact spans across the 17 goals, however we believe that our actions have most impact on the six SDGs highlighted in the overview table on the next page. ", "High value Creating shared value Provide energy and create value for shareholders ", "Create economic value and opportunities for society and communities ", "Develop people and promote diversity and inclusion", "Our business contributes to the Sustainable Development Goals. 
We believe in transparency and collaboration for greater impact .", "Equinor Sustainability report 2019Sustainability at EquinorEquinor Sustainability report 2019 Sustainability at Equinor"], "5": ["Sustainability ambitions, performance and impact on the SDGs", "Implemented the Safety beyond 2020 improvement programme ", "SIF: Serious Incident Frequency (per million hours worked)", "TRIF: Total Recordable Injury Frequency (per million hours worked).", "Oil and gas leakages (number of, leakage rate >0.1 kg per second) ", "Share of production in water scarce areas (%)", "Signed up to UN Global Compact's Sustainable Oceans Principles", "Always safe - Responsible operations", "Developed and implemented a company-wide human rights action plan", "Supplier human rights verifications conducted (number of)", "To be an industry leader in safety and security", "Enhanced collaboration with our suppliers", "Improve learning and assurance processes", "Improve sustainable management approach of oceans and biodiversity", "Implementing Equinor human rights project ambitions ", "Respect human rights as an employer, business partner and buyer", "Improved the anti-corruption risk management and monitoring process ", "Increased targeted trainings appropriate to the nature and location of the employees", "Implemented new strategy for diversity and inclusion Started up 6 fields, including Johan Sverdrup generating annually 2,700 manyears Successful bid for Empire Wind, with total investments of USD3 billion. 
Will power over 500,000 homes in New York.", "Developed new business models to produce renewable energy from Hywind Tampen to power oil & gas production", "Promoting integrity and transparency", "Percentage of employees completed the code of conduct course (%)", "Develop and implement a plan for strengthening compliance capability and ethics culture", "Purchase of goods and services (bnUSD) ", "Implementing Equinor shared value project ambitions ", "Our ambition is that all teams are diverse and inclusive by 2025", "Developed, anchored and published a strengthened climate roadmap", "Annual CO\u2082 emissions reductions (ktonnes)", "CO\u2082 intensity for the upstream oil and gas portfolio (kg CO\u2082/boe)", "Low carbon R&D expenditure in share of total (%)", "Investments in new energy solutions in share of total (%)", "Upstream portfolio carbon intensity of below 8kg CO\u2082/boe by 2025", "Norway: 40 % reduction in absolute CO\u2082 emissions by 2030 Equinor renewable equity generation capacity expected to increase ten-fold from 2019 to 2026 to 4-6GW ", "Reducing net carbon intensity by at least 50% by 2050", "Equinor Sustainability report 2019Sustainability at EquinorEquinor Sustainability report 2019 Sustainability at Equinor"], "6": ["Embedding sustainability in how we work ", "Our management approach: Sustainability governance and performance framework At Equinor, our approach to sustainability is embedded in how we work. This includes our corporate governance principles, performance and reward framework and management system. ", "The business line is accountable for executing the company\u2019s sustainability ambitions and for managing relevant risks and performance. Dedicated safety, security and sustainability staff in the business line is part of company-wide functional networks and provides advice and support to the business line. 
", "Governance The Equinor ASA board of directors (BoD) and corporate executive committee regularly review, monitor and discuss sustainability issues. This includes climate-related business risks and opportunities, and sustainability aspects of investment decisions. The BoD members are elected by the shareholders. In addition, there are employee-elected representatives as required by Norwegian law.", "The BoD safety, sustainability and ethics committee assists the BoD in its supervision of the company\u2019s safety, security, sustainability and ethics policies, systems and principles. This includes quarterly reviews of risk issues and performance and an annual review of the sustainability report. ", "The company has a separate corporate risk committee chaired by the chief financial officer. The committee meets at least three times per year to give advice and make recommendations on Equinor\u2019s enterprise risk management, including climate-related risks.", "Group level functions responsible for sustainability-related issues include safety and security, sustainability, people and leadership and legal. The heads of these functions at group level are responsible for setting strategic direction and reporting on risk and performance within these topics to the corporate executive committee and the BoD, including relevant committees.", "The corporate sustainability function is responsible for overseeing climate change (including climate-related risk), environment, human rights and social issues. The corporate safety function is responsible for safety, health, work environment and security. The chief compliance officer is responsible for business ethics and compliance. ", "Performance and reward framework Management of sustainability performance is integrated in strategy, business planning, risk management, decision- making and management follow-up processes. Our performance framework translates our vision, values and strategy into actions and results. 
We measure progress and results in a holistic way, using key performance indicators when relevant.", "Safety, security and sustainability management is an integrated part of our management system, which includes our policies, requirements and guidelines for all material topics. Together with our corporate governance principles and performance framework, this forms the basis for how we are embedding these topics in our business activities. The principles and framework are described in the Equinor book, which is approved by the CEO.", "At Equinor climate and sustainability is embedded into our performance and reward framework. The performance evaluation of the CEO and his direct reports is holistic and assessed and rewarded against, among others, both ambitious climate targets (KPIs) and results, and their ability as leaders to be role models for sustainable development and the transition into new energy sources. Equinor\u2019s broader leadership is in the same way assessed and rewarded based on a number of goals including climate and sustainability. Within safety, serious incident frequency (SIF), total recordable injury frequency and oil/gas leakages are key performance indicators which are used to measure performance. Finally, the annual bonus for employees is based on a holistic assessment of company performance which includes, among other areas, CO2 intensity and execution of climate strategies. A comprehensive set of performance indicators and monitoring reports are made available to all employees in our Management Information System (MIS). 
", "Sustainability integrated in our governance", "Safety, sustainability and ethics committee", "Compensation and executive development committee", "The effectiveness of our management approach is regularly evaluated through performance reviews at several management levels, including the corporate executive committee, the BoD and the BoD\u2019s safety, sustainability and ethics committee, and by corporate and business area staffs. The frequency and granularity of the performance reviews varies with materiality, frequency of reporting and management level. Internal and external audits, verifications and self-assessments constitute key assurance elements of our management approach. We conduct internal and external benchmarking and participate in external performance ratings for the same purpose. Concerns related to misconduct can be reported to relevant internal entities or to Equinor\u2019s Ethics Helpline which is available to any person. Equinor has developed internal requirements for establishing and running effective operational-level community grievance mechanisms. ", "Risk and impact management Management of sustainability and climate-related risks is embedded in our enterprise risk management process. We identify, evaluate and manage risks to create sustainable value and avoid incidents. Our enterprise risk assessment and related actions are reviewed biannually by the corporate executive committee and the BoD.", "Management of our planned activities shall include development and implementation of cost-efficient measures to avoid, minimise or mitigate adverse environmental and social impacts and risks, in accordance with good international practice and applicable laws and regulations. ", "More information about corporate governance on equinor.com"], "7": ["Some people are still disputing global warming. We\u2019re acting on it.", "Urgent need for action Climate change is one of the main challenges of our time and a clear call for action. 
Equinor acknowledges the findings of the Intergovernmental Panel on Climate Change (IPCC) that human activities contribute to global warming with detrimental effects on nature, people and society at large. We recognise that the world's energy systems must be transformed in a profound way to drive decarbonisation, while at the same time ensuring universal access to affordable and clean energy and realising the United Nations Sustainable Development Goals. We want to be an active player in this change by reducing emissions, growing in renewable energy and providing low carbon solutions to our customers to help accelerate decarbonisation. According to IPCC\u2019s 1.5 C report from 2018 and the two IPCC special reports from 2019 on land and on the ocean and cryosphere in a changing climate, global temperature rise has already reached 1C above the pre-industrial level. Global warming is damaging the ability of the land and the ocean to sustain humanity. To avoid an irreversible climate crisis, global warming needs to be kept to well below 2C and urgent actions are needed to reduce greenhouse gas emissions from all sectors.", " IPCC (2018): Global Warming of 1.5 C IPCC (2019): Climate Change and Land IPCC (2019): Special Report on the Ocean and Cryosphere in a Changing Climate", "Low carbon \u2014 Creating a low carbon advantage", "Low carbon \u2014 Creating a low carbon advantage"], "8": ["Energy Perspectives The future of energy is uncertain. Equinor\u2019s Energy Perspectives 2019 outlines a wide range of possibilities for the energy markets towards 2050 through three scenarios called Rivalry, Reform and Renewal. In Rivalry, the energy transition is slowed down by geopolitical uncertainty and volatility leading to climate policies receiving less priority. In Reform, market and technology forces drive the energy transition while the current policy momentum continues. 
Renewal, which is the closest to the International Energy Agency\u2019s (IEA) Sustainability Development scenario, shows a way to limit global warming to well below 2C compared to the pre-industrial level. This requires rapid and significant policy tightening, global cooperation, technology developments and substantial changes in business and consumer behaviour. ", "To reach the goals of the Paris Agreement we need to see a peak in global energy-related greenhouse gas emissions as soon as possible and net zero emissions in the second half of this century. Oil demand in 2050 in the Renewal scenario is about half of today\u2019s level and global gas demand declines by approximately 20%. Even in such a scenario there will be a need to invest in new ", "oil and gas due to natural decline of existing production. The investments needed are however significantly lower in Renewal than in the other scenarios, and oil and gas resources with low costs and low emissions intensity will have an advantage. ", "Natural gas plays an important role in all scenarios and the use of gas for power generation is the main area of growth. In Renewal, gas is a key enabler to phase out coal in the electricity mix and provides a flexible source of electricity generation that can support the uptake of variable renewables. In the mid-2030s, the use of gas needs to be reduced as well, especially in developed regions. ", "Renewable energy is expected to grow significantly in all scenarios, especially in the electricity sector where solar and wind takes on a leading role. In 2018, solar and wind accounted for about 7% of the global electricity mix. This is projected to grow to a share of between 30% to 50% depending on the scenario. The growth in electricity from solar and wind power is driven by technological improvements, reduced cost and continued regulatory support. 
", "Climate-related business risks and portfolio resilience ", "Our business needs to be resilient to the multiple risks \u2013 both upside and downside \u2013 posed by climate change. These include potentially stricter climate regulations, changing demand for oil and gas, technologies that could disrupt our market, as well as physical effects of climate change. ", "Governance and risk management Climate-related upside and downside risks, and Equinor\u2019s strategic response to these are discussed frequently by our board of directors and corporate executive committee. In 2019, the board of directors specifically discussed climate-related issues in seven of their eight ordinary board meetings. Climate-related risks were also assessed in relation to specific investment decisions. The board of director\u2019s safety, sustainability and ethics committee discussed climate-related issues in all committee meetings in 2019 ", "Management of climate-related risks is embedded in Equinor\u2019s enterprise risk management process. We use ", "internal carbon pricing, scenario analysis, and sensitivity analysis to assess and manage climate-related risks. We monitor technology developments and changes in policies and regulations and we assess how these might impact the demand for oil, gas and renewable energy, as well as the cost of developing new assets and opportunities for low- carbon technologies.", "Climate-related risk factors are identified by considering main sources of change (i.e., policy, legal, regulatory, market, technology, reputational and physical). Climate- related risk factors are assumed to both indirectly and directly influence Equinor\u2019s cash flow risk via effects on revenues or cost. This relationship is integrated into our risk assessment of revenues and costs and corresponding actions. As an example, climate-related risks could influence oil, gas and carbon price assumptions. Risk adjusting actions are evaluated, decided, and implemented as relevant. 
An overview of relevant risk factors and how we manage these, is provided below. For more information about governance and risk management, see Sustainability governance and management in this report.", "Our strategic response to climate related risks We acknowledge that an energy transition is ongoing and want to be in the forefront of this change. We believe that the energy transition represents opportunities for ", "Risk factors (upside and downside potential)", "Oil and gas demand Renewable energy demand", "Carbon costs and taxes Specific regulations (e.g. air quality, emission standards and fuel directives)", "Electrification of transport Renewable energy and battery technology CCUS, hydrogen and other low carbon technologies Digitalisation Energy efficiency ", "Scenario analysis and sensitivity testing Climate-related principles in investment decisions and break-even hurdle rates Scaling up investments in renewables and low carbon solutions Cost reduction initiatives ", "Monitoring policy and regulatory development Internal carbon price applied ", "Portfolio sensitivity test Emission reduction measures ", "Scaling up investments in profitable renewables and low carbon solutions Strengthening low carbon R&D Venture funds Digitalisation roadmap Emission reduction measures ", "Chronical effects (e.g. sea water rise, increased scarcity of water) Acute effects (e.g. more frequent and more extreme weather events)", "Regular updates of meteorology and oceanography data used in project design and operational planning ", "Talent attraction and retention Investors\u2019 perception of oil, gas and renewables investments Climate-related litigations License to operate ", "Transparency and disclosures of performance, governance and ambitions External engagement and communication ", "us. 
Equinor has low carbon as one of the main strategic pillars on which the governance of the company is based, and we embed climate considerations into decision making, sensitivity testing, incentives and reporting. ", "Decision making \u2013 We require all potential projects to be assessed for carbon intensity and address emission reduction opportunities for Equinor-operated projects at every decision phase \u2013 from accessing exploration and business opportunities to project development and operations. Furthermore, we require all projects to include a carbon price of at least USD 55/tonne, to be resilient towards expected higher carbon taxes. We continue to grow our renewable portfolio. ", "Scenarios \u2013 Equinor has since 2015 annually performed a sensitivity test of its portfolio against the IEA\u2019s energy scenarios in the World Energy Outlook (WEO) report. IEA describes three scenarios: Current Policies, Stated Policies (STEPS) and Sustainable Development (SDS), ", "which represent three different future pathways depending on varying climate policies. These scenarios have different oil, gas and CO\u2082 price assumptions, and these assumptions are applied to our portfolio to test its resilience. The sensitivity testing is a result of a shareholder resolution in 2015 where it was requested to test the portfolio against the range of IEA scenarios to be able to compare results with other companies in the industry. ", "Low-demand scenarios \u2013 The IEA\u2019s SDS scenario is a well below 2C scenario (1.7-1.8 C). According to the International Panel on Climate Change\u2019s (IPCC) report on impacts of a 1.5C scenario, the oil and gas demand needs to be lower in such a scenario than in a well below 2C scenario and thus represents a larger downside for Equinor than estimated in the SDS scenario. 
To cater for this uncertainty, we have done a sensitivity to the IEA price, where we apply a gradual reduction in the oil price to a long-term price of 50 USD/bbl in 2040, which is 9 USD/bbl lower than the long-term oil price of 59 USD/bbl in the SDS ", "Low carbon \u2014 Creating a low carbon advantage", "Low carbon \u2014 Creating a low carbon advantage", "Equinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantage"], "9": ["scenario. This sensitivity is illustrated in the chart Change in net present value. The lower the oil price, the higher assumed impact on the net present value of the portfolio. ", "Portfolio \u2013 The portfolio consists of producing assets and non-sanctioned projects. The value of our portfolio represents the total value of our company measured in net present value. Exploration activities are excluded from this portfolio, due to significant uncertainties around potential discoveries and development solutions. ", "Carbon price \u2013 In our decision making, we require all producing assets and non-sanctioned projects in all countries to include a carbon price in their investment case. In countries where there is currently no carbon price in place, we apply USD 55/tonne CO\u2082. This is done to ensure that the asset will be resilient if a carbon price should be introduced. In countries where the current or predicted CO\u2082 price is higher than USD 55/tonne, such as in Norway, where both a CO\u2082 tax and the EU ETS apply, we use the expected CO\u2082 price. We also test the sensitivity of a carbon price of USD 100/tonne to test the robustness of our assets. ", "The figure includes CO\u2082 costs and other environmental costs paid by Equinor in 2019. Costs are reported for Equinor-operated assets only, on a 100% basis. This includes EU Emission Allowances System (EU ETS) quotas, Norwegian CO\u2082 tax and a CO\u2082 related royalty fee in Brazil. 
", "Robustness \u2013 Even though we expect a lower value generation in a low-price environment, we consider our portfolio to be robust. For example, the average break- even of our non-sanctioned portfolio of projects coming on stream by 2026 and 2029 is below USD 35/bbl and below USD 40/bbl respectively (volume weighted, upstream portfolio). These are break-even levels we consider to be robust. ", "In a low-price scenario, illustrated by the USD 50/bbl in 2040 sensitivity to the SDS scenario, our producing assets continue to generate a positive cash flow. However, a few assets will have an earlier economic cut-off. Also, most of our non-sanctioned portfolio continues to be profitable, although a few non-sanctioned projects after 2025 could be challenging in such a scenario. However, these projects are still immature and will most likely improve as they are developed. Furthermore, our sensitivity analysis does not consider how the portfolio and possibly frame conditions would change in a scenario where a low oil price persists over time, where costs would be expected to be reduced and adaptations to tax regimes could be anticipated. ", "Resilience \u2013 Equinor follows a set of financial principles that enables us to stay resilient in the long run: \u2022 Cash generation at all times: Assets must be able to provide positive cash flow when prices are low and to be cost efficient when prices are high. Our non- sanctioned upstream portfolio coming on stream the next 10 years has a volume weighted break-even of below USD 40/bbl.", "\u2022 Capture value from cycles: We have demonstrated in the past the ability to create value through the cycles, by adding resources in downturns and optimising the portfolio in upturns. ", "\u2022 Cost competitiveness: We seized the opportunity that arose from the previous downturn to make lasting improvements, and we aim to keep cost levels under control when the prices are increasing. 
", "\u2022 Capex flexibility: The oil and gas market are cyclical by nature. When prices fall, we want to be able to reduce our activity quickly and adjust our investment levels in a controlled way. Only investments related to sanctioned projects are committed, and all non- sanctioned projects are flexible. The flexible part of investments is increasing and is estimated to be around 75% of current capex forecast for 2022. ", "Furthermore, we maintain a contingency plan in the event of a sudden price drop like we experienced in 2014. This plan contains measures to reduce cost and investments in the short run in order to stay cash flow positive despite low prices.", "Percent carbon costs relative to value of portfolio", "Impact of IEA scenarios on Equinor\u2019s portfolio The sensitivity analysis performed in 2019 indicates that our portfolio is robust in the IEA scenarios (World Energy Outlook 2019). The chart illustrates the changes in the net present value (NPV) of Equinor\u2019s portfolio when replacing our own assumptions regarding oil, gas and carbon prices with those of the IEA scenarios. For the economic analysis we assume a gradual price development between the specific years for which IEA defines oil and gas prices. We also assume flat prices from 2040 and use Equinor economic planning assumptions for the year 2019. We add a USD 2/bbl transportation cost to the IEA oil price to allow for comparison with Brent Blend. We also use Equinor planning assumptions on carbon price for the NCS throughout all scenarios and vary only carbon pricing for all other countries. For the USD 50 in 2040 sensitivity, we only change the oil price, all other price assumptions are kept unchanged.", "Carbon price sensitivity The chart illustrates that the net present value (NPV) of all future carbon costs represents 7% of total NPV of Equinor. These costs include a carbon price of USD 55 /tonne for all countries from 2020 (except Norway, where CO\u2082 cost is higher). 
If we apply a USD 100/tonne carbon price, instead of USD 55/tonne, as a sensitivity, the carbon costs will increase from 7% to 9%. The carbon costs calculated with Equinor\u2019s assumptions are higher because we have applied carbon cost for all countries in our portfolio while IEA has not.", "Equinor equity generation capacity 2026 and 2035 include 15.2% share of Scatec Solas ASA", "Future production in renewables (GW) and oil/gas (bbl) Equinor\u2019s renewable production is increasing, and we believe it will continue to increase as we continue to further invest in the renewable business. The current portfolio is dominated by conventional oil and gas. Equinor\u2019s production in conventional oil and gas, which have a relatively low carbon intensity compared to heavier segments, represent 86% of total production.", "Low carbon \u2014 Creating a low carbon advantage", "Low carbon \u2014 Creating a low carbon advantage", "7%Equinor\u2019s planningassumptions4%Current portfolios4%Stated policies6%Sustainable development9%0%2%4%6%8%10%USD 100 CO2price sensitivity40%30%20%10%0%-10%-20%-17%-14%18%36%Current policiesStated policiesSustainabledevelopmentSDS:Sensitivity USD 50 in 2040201920262035Market exposureFixed price levels201920300%10%20%30%40%50%60%70%80%90%100%Norway Brazil Great Britain Norway Denmark Denmark (Total USD 786 million, Equinor-operated assets only, on a 100% basis)"], "10": ["Industry leading carbon efficiency", "In 2019, Equinor reviewed its climate ambitions and launched a new Climate Roadmap at the Capital Markets Update on 6 February 2020. 
To ensure a competitive and resilient business model in the energy transition, and to contribute to the dual societal challenge of providing energy with less emissions, Equinor aims to:", "Reduce the net carbon intensity, from initial production to final consumption, of energy produced by at least 50% by 2050", "\u2022 \u2022 Grow renewable energy capacity tenfold by 2026, developing as a global offshore wind major \u2022", "Strengthen our industry leading position on carbon efficient production, aiming to reach carbon neutral global operations by 2030.", "Equinor\u2019s Climate Roadmap sets out new short-, mid- and long-term ambitions to reduce our own greenhouse gas emissions and to shape our portfolio. To achieve these ambitions, we need to strengthen our collaboration with governments, customers, and industry sectors to speed up the pace of the transition and deliver solutions at scale. Therefore, it is also a standing invitation to engage in a dialogue and work with us in shaping a more sustainable energy future. ", "Climate is embedded in our decision-making ", "Industry leading in carbon efficiency", "Develop a high value renewable business [1]", "Carbon neutral global operations by 2030[2]", "Absolute GHG reductions in Norway[3] \u2022 40% by 2030 \u2022 70% by 2040 \u2022 Near zero by 2050", "Keep methane emissions intensity near zero by 2030[6]", "Reduce net carbon intensity by at least 50% by 2050[7]", "Equinor aims to reduce the CO\u2082 intensity of its globally operated oil and gas production to below 8kg CO\u2082/boe by 2025, five years earlier than the previous ambition. The current global industry average is 18kg CO\u2082/boe. To achieve this, we assess carbon intensity when we shape our portfolio and work on energy efficiency and emission reduction measures. 
", "Reducing our absolute emissions in Norway towards near zero by 2050 In January 2020 Equinor launched new climate ambitions to reduce the absolute greenhouse gas emissions from its operated offshore fields and onshore plants in Norway by 40% by 2030, 70% by 2040 and to near zero by 2050. By 2030 this implies annual cuts of more than 5 million tonnes, corresponding to around 10% of Norway\u2019s total CO\u2082 emissions. ", "A 40% reduction by 2030 is planned to be realised through large scale industrial measures, including energy efficiency, digitalisation and the launch of several electrification projects at key fields and plants, including the Troll and Oseberg offshore fields and the Hammerfest LNG plant. The 2030 ambition is expected to require investments of USD 5-6 billion (NOK 50 billion) for Equinor and its partners.", "Further reduction ambitions towards 70% in 2040 and close to zero in 2050 will entail additional measures, further electrification projects, consolidation of infrastructure as well as opportunities to develop new technologies and value chains. In 2050, Equinor expects Norwegian oil and gas production to be less than half of current levels, assuming development of the defined projects ahead of us, substantial efforts to increase production from existing fields and continued exploration.", "During 2019, the business areas implemented several emission reduction measures, including better energy management, improved technical design, electrification and efforts to minimise methane emissions and flaring. ", "Energy efficiency In 2019, a modification of the compressor system on Gullfaks C and new gear for a Grane gas compressor was installed, reducing CO\u2082 emissions by 35,000 tonnes per year. We also increased the efficiency of ten turbines on nine platforms by changing the inlet filters. This measure alone reduced 17,000 tonnes of CO\u2082 emission in a year. 
We will continue to implement turbine and compressor efficiency and other energy efficiency measures in 2020. ", "Electrification of offshore assets We are exploring opportunities for further electrification of offshore fields. In 2019, the Johan Sverdrup field came on stream powered by electricity from land, making it one of the most carbon-efficient fields worldwide. CO\u2082 emission reductions from the field due to power from shore are estimated at more than 460,000 tonnes of CO\u2082 per year, totalling almost 20 million tonnes of CO\u2082 over the life of the field. ", "Equinor and partners plan to maximise the utilisation of power from shore for the Utsira High area. In the second phase of the Johan Sverdrup field development, a power hub will be installed, allowing for the Gina Krog, Ivar Aasen and Edvard Grieg fields, as well as Johan Sverdrup second phase, to be powered from the onshore grid. In October 2019, Equinor announced that the area\u2019s license partners are working towards a partial electrification of the Sleipner field, together with the Gudrun platform and other tie-ins. In total ten fields will receive power through the Utsira High area solution, contributing to an average reduction of 1.2 million tonnes of CO\u2082 per year. ", "Together with partners we sanctioned and submitted the Plan of Development for Hywind Tampen to the authorities. This is a project that uses floating wind turbines to generate renewable electricity to supply two oil and gas fields in the Tampen area: Snorre and Gullfaks. Once completed, around 35% of the annual power demand from the five platforms in the area will be met by a floating offshore wind farm. Emissions from the Gullfaks and Snorre fields will be reduced by more than 200,000 tonnes per year. 
", "[1] Equity base, installed capacity (GW); reference year 2019 [2] Operational control 100%; including scope 1 and 2 CO2 & CH4 [3] Operational control 100%, Norway; reference year 2005 [4] Operational control 100%, upstream; including scope 1 CO2 [5] Operational control 100%; including CO2 & CH4 ", "[6] Operational control 100% [7] Scope 1 and 2 GHG emissions (100% operator basis); Scope 3 GHG", "emissions from use of sold products (equity production); Energy production (equity); reference year 2019", "Low carbon \u2014 Creating a low carbon advantage Low carbon \u2014 Creating a low carbon advantage", "Equinor Sustainability report 2019 Equinor Sustainability report 2019"], "11": ["Minimising methane emissions Methane is the second most important greenhouse gas contributing to human induced climate change. We have estimated Equinor\u2019s methane intensity for the upstream and midstream parts of the value chain that we control to be as low as approximately 0.03%. Equinor aims to continue to pursue an intensity ambition of near zero. We will continue to develop and implement technologies and procedures to detect and reduce methane emissions, support industry efforts to reduce methane emissions across the oil and gas value chain, increase the quality and transparency of reported data, and support the development of sound methane policies and regulations. ", "Reduced flaring We have set a company-wide upstream flaring intensity target of 0.2% by 2020 for our operated assets. This was set in 2012 as part of our commitment to the Sustainable Energy for All Initiative. Our aim is to eliminate routine flaring in our operations by 2030 at the latest, in line with the World Bank\u2019s Zero Routine Flaring by 2030 Initiative. In Norway we do not have routine flaring in our operations. We have been working systematically to reduce flaring on the Norwegian Continental Shelf (NCS) as well and have seen a positive trend. 
Reductions have been achieved mostly by changing our operating procedures, such as when starting a well, and due to hardware changes, ", "for example the semi closed flare solution implemented at Statfjord C. We are also investigating reduction opportunities from increasing awareness by better monitoring of flare rates, tuning of separator pressure control and increasing the reliability of important rotating machinery. ", "We currently have flaring from the Mariner field due to gas production exceeding the need for power generation in the early production phase. After a few years, the field will use all its associated gas for energy production and flaring will be stopped. We expect Mariner to meet our commitment to the World Bank 2030 zero routine initiative.", "We still have routine flaring in the Bakken due to challenges related to gas infrastructure. Production growth in this area has exceeded the midstream pipeline capacity, resulting in excess gas being sent to flare rather than to sales. Our Bakken team has identified several measures to reduce flaring. However, further improvement actions are required for Equinor to achieve its 2030 ambition of zero flaring from the Bakken field.", "Carbon neutral operations We aim for carbon neutral global operations, for our operated scope 1 and 2 emissions, by 2030. The main priority will be to reduce GHG emissions from our own operations. Remaining emissions will be compensated either through quota trading systems, such as the EU ETS, or high-quality offset mechanisms such as natural sinks. By setting this ambition, Equinor demonstrates its long-standing support to carbon pricing and the establishment of global carbon market mechanisms as outlined in the Paris Agreement. ", "Natural climate solutions, particularly protection of tropical rainforests and other land-based solutions, can contribute up to one-third of the climate efforts the world needs over the next decades. 
We plan to invest in the protection of tropical forests as an effective measure to combat climate change.", "Floating offshore wind We have a decade of operating experience from floating offshore wind. Up to 80% of the world\u2019s offshore wind potential will likely require floating solutions and Equinor is well positioned to industrialise floating wind. Our ambition is to bring floating wind towards commerciality by 2030. In 2019, the pioneering Hywind Tampen project was sanctioned, having received USD 261 million in support from Enova. In addition to delivering CO\u2082 reductions, this project will be a key driver of technology development and the journey to scale and improved competitiveness for floating wind. ", "Maturing opportunities in onshore We believe in diversifying our offshore wind business and pursuing additional growth options. Having a flexible portfolio gives us the ability to provide power from numerous renewable energy sources including offshore wind, solar and onshore wind. ", "In 2019, Equinor expanded in onshore renewables by investing in a 50% stake alongside YPF Luz for the development of the 150MW Ca\u00f1ad\u00f3n Le\u00f3n wind farm in Argentina. We are also engaged on the owner side with a 50% share of the 162MW Apodi solar production asset in Brazil, and a similar share of the 117MW Guanizul IIA solar project in Argentina that is currently under construction. Both assets are operated by Scatec Solar. In 2019, Equinor increased its total shareholding in Scatec Solar to 15.2%.", "The renewable market is changing and growing at an unprecedented pace, presenting opportunities for decades of growth. Equinor has a strong renewable portfolio in production, and we are leveraging our core competencies in managing complex oil and gas projects when growing in offshore wind. ", "By 2026 Equinor expects to increase our share of installed capacity from renewable projects to between 4 and 6GW (Equinor equity), mainly based on the current project portfolio. 
This is around 10 times higher than today\u2019s capacity, implying an annual average growth rate of more than 30% in electricity production. Towards 2035, Equinor expects to increase installed renewables capacity further to between 12 and 16GW (Equinor equity), depending on availability of attractive project opportunities.", "Global offshore wind major The past few years have been transformational for Equinor\u2019s offshore wind portfolio. With the recent additions of Dogger Bank (UK) and Empire Wind (US), we are on the path to becoming a global offshore wind major. Dogger Bank will be the world\u2019s largest offshore wind farm development and Empire Wind will provide renewable electricity to the equivalent of one million homes in New York City. ", "The primary focus for Equinor\u2019s renewables business over the next years will be on safe and efficient operations, developing projects and strengthening competitiveness. Equinor has reached several important milestones in off- shore wind in 2019: \u2022 Secured a 20-year offtake agreement for the ", "strategically important Empire Wind (816 MW) project offshore New York City. ", "\u2022 Achieved scale in development of a North Sea offshore wind cluster through the award of the 3.6GW Dogger Bank project together with SSE, and by securing the area for potential extension of Sheringham Shoal and Dudgeon windfarms in the UK. ", "\u2022 Partially farmed-down the Arkona asset, demonstrating ", "value creation and portfolio optimisation through valuable partnerships. ", "\u2022 Signed Memorandum of Understandings with ", "Korea National Oil Corporation (KNOC) and China Power International Holding (CPIH) to cooperate on development of offshore wind. ", " Enova is a state enterprise owned by the Ministry of Climate and ", "Environment of Norway. 
Its task is to promote a shift towards more environmentally friendly energy consumption and production, as well as the development of energy and climate technology.", "Equinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantageEquinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantage"], "12": ["We aim to increase our equity renewable capacity ten-fold from 2019 to 2026.", "Wind projects in operation and construction", "Equinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantageEquinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantage"], "13": ["Accelerate decarbonisation for society ", "While it is critical for Equinor to be at the forefront of the energy transition, we will only succeed if other industries, suppliers, governments and consumers come together to find common solutions. That is why Equinor is committed to taking tangible steps to contribute to accelerating decarbonisation. Our ambition to reduce net carbon intensity by at least 50% by 2050 is a platform for further collaboration with our stakeholders in finding solutions to reducing emissions across the whole value chain. ", "Developing low-carbon solutions More than 85% of the total emissions from oil and gas comes from the use of the products. Equinor aims to develop low carbon solutions to accelerate decarbonisation for society and the industry. We promote CCUS and hydrogen solutions as these technologies can remove CO\u2082 from high-carbon industrial sectors that cannot be easily decarbonised, such as industry, maritime transport, heating and power generation. Maturing and expanding CCUS and hydrogen can only be realised in close collaboration with governments and customers, to establish a commercial framework and build new markets. 
We also need strategic partnerships with industrial players to ensure safe, reliable and cost-effective implementation.", "CCUS As a leader in CCUS, Equinor is working to build a European value chain, capturing and storing CO\u2082 from industrial plants that have CO\u2082 as a by-product, for example waste management facilities and cement producers. The Norwegian government is a key partner and has also set the ambition to develop a full-scale CCUS value chain in Norway by 2024.", "We are currently involved in the Northern Lights project, together with Shell and Total, which includes the transport and permanent storage of CO\u2082 in a safe reservoir in the North Sea. Northern Lights is part of the Norwegian Government\u2019s Full-scale value chain in Norway demonstration project. In 2019, Equinor has on behalf of the partners signed memoranda of understanding (MoUs) with seven European companies to develop value chains in carbon capture and storage. At the end of 2019, the partnership drilled a confirmation well to study the reservoir\u2019s suitability and capacity for CO\u2082 storage. The partners are currently reducing costs and further developing the Northern Lights project, aiming for an investment decision in 2020.", "Permanently stored reservoir (2500 - 300 meters below the sea bed)", "CO2 Capture Capture from industrial plants", "Hydrogen Combined with our strong position in natural gas, Equinor is prepared for future growth in hydrogen, which offers large-scale opportunities for zero emission energy while leveraging existing infrastructure. By removing CO\u2082 from natural gas, Equinor can produce emission-free hydrogen that can be used in industrial settings, such as power generation and marine fuels as well as residential ones, such as heating. 
", "Equinor is currently involved in several hydrogen pilots and projects, such as Zero Carbon Humber in the UK, where we are exploring how hydrogen can help decarbonise the largest industrial cluster in the country. ", "H2 Ammonia in shipping Replacing diesel/fuel oil in the shipping sector", "Clean steel Decarbonisation of the steel industry - replacing coal with hydrogen", "Northern lights A Norwegian full-scale CCS project, including capture of CO\u2082 from industrial sources", "HyDemo Norway Demonstration of natural gas-based hydrogen pro- duction with CO\u2082 removal and storage", "Zero Carbon Humber Aim to build the world\u2019s first zero carbon industrial cluster in the North of UK", "Investing in low-carbon research and technology We believe new technologies and innovation will provide future solutions to energy and climate challenges. This is why Equinor\u2019s R&D projects are essential. Equinor\u2019s current ambition is to increase the low carbon (renewable energy, low carbon solutions, and energy efficiency) share of R&D funding to 25% by 2020. ", "The Equinor Energy Ventures fund, dedicated to invest in attractive and ambitious growth companies in low carbon and new energy solutions, has been operating since February 2016. More than two-thirds of the original USD 200 million has been committed. The fund currently holds thirteen direct investments across different segments and is a limited partner to three financial venture capital funds on two different continents.", "To reduce emissions from our gas turbines offshore, we developed in 2019 waste heat-to-power technology that has the potential to reduce CO\u2082 emissions from offshore installations by typically 15-25%. The technology uses the exhaust heat from gas turbines to generate electric power and heat for process plants through a steam cycle. This UltraLight Bottoming Cycle (ULBC) technology became ready for first use in October 2019. 
", "Low carbon \u2014 Creating a low carbon advantage", "Equinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantageEquinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantage"], "14": ["to reduce emissions across the oil and gas value chain. We have teamed up with 12 peer companies in the Oil and Gas Climate Initiative (OGCI) to help shape the industry\u2019s climate response. To spur technology development, we are a partner in the USD +1 billion investment fund OGCI Climate Investment. ", "We continue to report on climate-related risks and opportunities in line with the recommendations of the Task Force on Climate- related financial Disclosures (TCFD). To enhance our work on reducing methane emissions, we have joined the One Future Coalition, the Climate and Clean Air Coalition Oil and Gas Methane Partnership and the Guiding Principles on Reducing Methane Emissions Across the Natural Gas Value Chain. ", "We also welcome the constructive engagement with investors participating in Climate Action 100+. As part of this dialogue, Equinor announced new commitments in April 2019 to set climate-related ambitions beyond 2030, explore emission reduction opportunities along the value chain, enhance the link between climate ambitions and remuneration of senior executives and employees, and reviewing memberships in relevant industry associations with regard to indirect policy engagement. ", "Review of membership associations Climate change calls for new solutions and partnerships. We recognise that it is important that our memberships in relevant industry associations do not undermine our support of the Paris Agreement. Our expectations to associations, in which we are a member, are found on Equinor.com. ", "During 2019 Equinor undertook a comprehensive review of its memberships in industry associations that have a position on climate and energy policy. 
Equinor holds membership and is engaged in more than 100 energy and climate associations and initiatives globally, of which approximately 25% are non- advocacy. We have inquired the associations with an active policy agenda to determine whether their respective climate stance is in alignment with Equinor's. After a screening of more than 80 associations within scope, some of the associations have been subject to a deeper assessment where they were contacted in writing and feedback was received. ", "More information about our review on equinor.com", "Need for efficient climate policies Forceful actions are needed to advance the energy transition, enabling society to combat climate change while promoting affordable energy, economic growth, and sustainable development. ", "target the most significant greenhouse gas sources ", "Equinor\u2019s expectations are that policy measures should: \u2022 \u2022 be predictable, transparent and internationally aligned, to trigger investments and innovation \u2022 phase out subsidies on fossil fuels that exacerbate climate change and undermine the effects of other policy ", "measures, such as carbon pricing and efforts to achieve sustainable development ", "\u2022 promote research and development through public measures that stimulate investments in energy efficiency, ", "renewable energy, carbon capture, utilisation and sequestration, hydrogen and other low carbon solutions; and, \u2022 adopt a price on carbon that can deliver material and cost-efficient greenhouse gas emission reductions and a ", "scale-up of investment in sustainable natural carbon sinks. ", "We will increase our engagement with governments and like-minded organisations to support carbon pricing and complementary climate and energy policies. Through these measures, we encourage fuel switching from coal to gas, growth in renewables, the deployment of CCUS and other low carbon solutions, as well as efficient production, distribution and use of energy globally. 
Since 2000, we have been committed to long-term sustainable value creation in line with the principles of the United Nation\u2019s Global Compact (UNGC). Collaboration We collaborate with peers and business partners to find innovative and commercially viable ways ", "Equinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantageEquinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantage"], "15": ["2018. Several new low carbon technology projects were initiated late in 2019 to replace projects exiting the portfolio, but these will first show in indicator in 2020. The total low- carbon R&D expenditure was around USD 59 million, of which around 67% was spent on projects related to CCS and renewables.", "Scope 1 GHG emissions decreased from 14.9 million to 14.7 million tonnes of CO\u2082 equivalents, mainly due to turnaround activities in the midstream segment. We delivered 303,000 tonnes of CO\u2082 emission reductions in 2019, mainly due to many energy efficiency projects. So far, we have achieved around 0.9 million of the 2030 target of 3 million tonnes of CO2 emission reductions per year, set in 2017. ", "Source: IOGP (2019), Environmental Performance Indicators (results are lagging by one year). ", "Emissions and emission reductions In 2019, Equinor\u2019s upstream CO\u2082 intensity (operated) increased from 9.0 to 9.5kg CO\u2082/boe. The increase was mainly caused by lower gas export from the Norwegian continental shelf due to sustained low gas prices. However, Equinor\u2019s upstream CO\u2082 intensity remains considerably lower than the industry average of 18kg CO\u2082/boe. ", "From 2020, with the addition of a full year of production from the electrified Johan Sverdrup field, we expect the CO\u2082 intensity to improve. As such, and due to several identified CO\u2082 emission reduction measures in Norway, the 2030 CO\u2082 intensity ambition has been moved forward to 2025. 
", "The methane intensity (operated) remained very low at around 0.03%, which is significantly lower than the industry average of around 0.3% as measured by the Oil and Gas Climate Initiative (OGCI 2018 Annual Report). ", "Our 2019 flaring intensity (upstream, operated) increased slightly from 2.4 to 2.5 tonnes/1000 tonnes of hydrocarbons produced, slightly above the 2020 target of 0.2%. This is significantly lower than the industry average of 1.1%. The increase is caused mainly by a flaring increase at Bakken due to lack of infrastructure capacity to offtake associated gas, as well as flaring at Mariner. Equinor will continue focusing on reducing flaring to achieve the ambition of zero routine flaring by 2030.", "Overall, the climate performance confirms that Equinor\u2019s management approach is effective and that we are well positioned to deliver on the updated climate ambitions.", "Renewable energy and low-carbon research and development (R&D) In 2019, Equinor\u2019s renewable energy production (equity basis) increased from 1.3 to 1.8 TWh. The increase is due to a growing portfolio and the first full year of production at Arkona. Capital expenditure on new energy solutions in 2019 was around USD 0.3 billion. The increase is in line with the strategic direction of growing in renewables, and the management approach is assessed to be effective. Our low-carbon and energy efficiency R&D expenditure was around 20% in 2019, which is a small decrease from ", "tonnes of gas flared per1000 tonnes of hydro- carbon produced", "Low carbon \u2014 Creating a low carbon advantage", "Includes energy efficiency projects and projects with energy efficiency as a secondary effect. ", "[1] Upstream: All operations from exploration to production, excluding onshore gas processing and LNG facilities. (a) Scope 3 figures have been updated to reflect a change in methodology. 
The change has resulted in a decrease in emissions levels, mainly due to the introduction ", "of a non-energy fraction of sold products. ", "Equinor Sustainability report 2019Low carbon \u2014 Creating a low carbon advantageEquinor [1]Equinor targetIOGP average [2]Upstream CO\u2082 intensity (KPI)(kg CO\u2082/boe, 100% operated basis)[1] Established as a corporate KPI in 2015. [2] IOGP Annual Environmental Performance Indicators report; IOGP members annual survey of upstream oil and gas activities. The results are lagging by one year.051015202015201620172018201920259.7179.8178.8189.09.58.018Annual CO\u2082 emissions reductions(thousand tonnes, 100% operated basis)Annual CO\u2082 emissions reductionsTarget 201920040060020155533243562643032752016201720182019(percentage)0(million USD)05201040156020802510030120201520162017201820192020Low carbon and energy efficiency R&D expenditure(100% operated basis)Share of total R&D expenditures 2020 targetActual expenditure 5717%17%18%21%20%25%52556659"], "16": ["I am visible and engaged in my team\u2019s safety and security", "I stop unsafe behaviours and activities", "I openly report and learn from all incidents", "I systematically use Compliance and Leadership", "I continuously improve safety and security", "I actively search for weak signals and act", "Safety and security at Equinor: Business context and our approach Our safety and security work are guided by our commitment to prevent harm to people's health, safety and security and the environment. The management approach comprises safeguarding people and the environment through design, ongoing reviews of technical and non-technical barriers, proactive maintenance work, periodic risk assessments and emergency preparedness training, as well as through collaboration with our partners and contractors. 
To improve our results, we regularly evaluate monitoring indicators, review and learn from incidents, conduct verification activities, and implement improvement initiatives as needed. We consider these efforts and the adaptation of the management approach as satisfactory to ensure continuous improvement and as a contribution to our pursuit of zero harm to people and the environment.", "Equinors\u2019 strategy defines \u2018\u2019Always safe\u2019\u2019 as one of its three main elements and our ambition is to be a leader in safety and security in our industry. Based on a review of best practices in previous years, areas for improvement have been identified, and in 2019 several initiatives aimed at strengthening the safety culture and consistency across the company were rolled out. ", "Health and working environment are integral parts of our efforts to safeguard people by focusing on risk management of factors such as chemicals, noise, ergonomic workplace and psychosocial aspects. To reduce downsides and realise sustainable and lasting upsides, we monitor and manage psychosocial aspects on an ongoing basis. As our international presence develops, the company is presented with different sets of security risks that we need to manage. The security threat landscape has evolved significantly since we launched our five-year security roadmap in 2015. Equinor faces a high threat of targeted terrorist attacks in some locations, furthermore, criminal violence is a concern for staff at some of the assets and offices. Worldwide there is a high threat of cyber-attacks, and this is expected to continue to grow. 
Against this backdrop, we continue to address these threats through a strengthened security culture and organisation which seeks to manage all security risks to our people, assets and information.", "2019 Serious incident frequency (SIF - per million hours worked)", "2019 Total recordable injury frequency (TRIF - per million hours worked)", "Equinor Sustainability report 2019 Equinor. Sustainability report 2019 ", "Always safe - Responsible operations Always safe - Responsible operations", "Equinor Sustainability report 2019Always safe - Responsible operations"], "17": ["Emergency preparedness and response Equinor is a member of an international emergency management work group and has established an international agreement with selected peers regarding joint training and exercises to increase our emergency response capability and competency. ", "Equinor personnel routinely train and exercise on their roles and responsibilities in emergency response situations, to be sufficiently prepared if, and when, incidents occur. In 2019, our emergency response protocols were activated in the aftermath of Hurricane Dorian in the Bahamas. ", "Equinor owns and operates the South Riding Point (SRP) terminal for storage and transshipment of oil, located on Grand Bahama Island. In September 2019, the country was impacted by Hurricane Dorian, resulting in the worst natural disaster in its history. In advance of the impact, Equinor shut down SRP operations and took measures to secure personnel and the facility. In line with normal procedure, our emergency preparedness organisation was also engaged. At the time the hurricane arrived, we had 54 personnel on Grand Bahama. All were confirmed safe and accounted for. However, the terminal sustained damage and an oil spill was confirmed at a volume of 55,000 barrels out of 1,870 million barrels stored. 
Most of the spilled volumes ", "Actions to improve safety and security In 2019, safety initiatives were implemented through the company-wide improvement project: Safety beyond 2020. The goal has been to further strengthen the safety culture and performance through risk awareness and proactive behaviour at all organisational levels. The project builds on the existing I am Safety governance, which highlights that individuals are personally accountable for safety. Four main areas for improvement have been identified: safety visibility, leadership and behaviour, safety indicators and learning and follow-up.", "Safety visibility has been improved through the implementation of a broad set of actions in all locations. This includes \"Life-Saving Rules\" based on the industry standard from International Oil and Gas Producers association which has been rolled out throughout the company. ", "I am safety expectations at all organisational levels were launched in 2019, this to enhance employee engagement and more active risk management. The aim is to ensure a more consistent behavioural pattern across the company. ", "Safety indicators that improve proactivity; leading indicators, have been given higher priority through increased attention to and follow-up of known underlying causes behind incidents. ", "Establishment and implementation of company-wide processes focusing on closed loop learning and assurance activities are done to ensure better learning and experience transfer. ", "Equinor is currently introducing a new operational planning tool aimed at improving operational safety and risk management at onshore and offshore installations during operations and maintenance. It is designed to strengthen compliance with work processes for safe work, including work permits, safe job analysis, isolation plans and operational risk assessments. 
Live overview of planned and ongoing activities is displayed along with factors affecting risk exposure such as leaks and seeps, dispensations and other operational conditions. Gathering all safe work information in one system provides a better overview of the total risk picture of the installation and thereby enables improved risk management. ", "were within or near the terminal area. The free oil at and around the terminal has been collected. Clean-up continues in forest areas north-east of the terminal, closely monitored by environmental experts. There have been no confirmed observations of oil on sea water coming from the oil spill. Tests of groundwater from monitoring wells on site in November 2019 show no contamination from the oil spill. Groundwater sampling events will be completed on a quarterly basis throughout 2020.", "over many years. Our workforce is also exposed to risk factors such as noise and chemicals, these areas are followed up in our daily work and through continuous improvement efforts. ", "Security Equinor continues to face a range of physical and cyber security threats that are continuously monitored, evaluated and communicated across the company. ", "An emergency situation with the Viking Sky cruise ship in March 2019 demonstrated that Equinor may contribute to saving peoples\u2019 lives also outside of our own operations. The large cruise ship experienced an engine failure with 1,373 people on board, and it was drifting dangerously close to shallow waters under highly challenging weather conditions. Equinor released three rescue helicopters and four vessels for the rescue operation. ", "Health and working environment A healthy, inclusive and safe working environment is important to ensure safe and efficient operations. To maintain a good working environment in the long term, we systematically monitor trends related to illness, and especially work-related illness. 
A significant contributor to the latter has been psychosocial aspects and these have therefore been actively managed and monitored ", "Competence development and awareness for all staff is important to strengthen security culture. Our security month in 2019 had the theme See Something, Say Something which was designed to simplify the incident reporting process. An increasing international presence places renewed importance on travel security. We developed specific country requirements for travelers and made them more easily accessible through company Apps and online platforms. ", "The increasing threat to IT systems and information remains a concern and increased focus is given to this area through a series of mandatory cyber-security awareness courses. Email is the most commonly used attack vector followed by infected web sites. Every day more than 500,000 emails are sent to Equinor addresses. More than 50% of these are stopped by technical barriers due to undesirable or potentially harmful content. However, there are still emails getting through that may pose a risk to the company. Our employees are the company\u2019s main barrier in this context, and we are actively working to ensure that all of them have the knowledge and tools they need to reduce the likelihood of malware being uploaded to our network. Over the last five years, all employees have been exposed to tailored phishing emails to test how good they are at capturing suspicious messages. During 2019, we made the emails more complex to improve the ability to identify sophisticated attacks and respond appropriately. ", "The effective interface between security disciplines has been further strengthened through the modification of our security risk assessment tool to combine physical, IT and personal security risk assessments. 
We have also focused on competency assurance for security risk management experts which is intended to drive standardization and quality.", "Always safe - Responsible operations", "Always safe - Responsible operations"], "18": ["Our performance In 2019, we experienced no major accidents or incidents with fatalities 1.", "However, to learn and improve our business activities we evaluate near-misses and undesirable conditions with respect to the potential for major accidents under slightly different circumstances. Last year we identified two conditions with major accident potential. A pressure vessel valve at the Hammerfest LNG plant in Norway had weaknesses that could have resulted in a situation of overpressure, a large hydrocarbon leakage and subsequent ignition. And a blowout preventer at the Gullfaks C platform offshore Norway had internal damage and design issues that could have caused a well control situation developing into a blowout.", "Serious incident frequency The safety and security of our people and integrity of our operations continues to be our top priority. Over the last decade we have improved our safety performance. However, in 2019 the total Serious Incident Frequency (SIF), which include incidents with potential consequences, ended at 0.6 incidents per million work hours, up from 0.5 in 2018. We are working hard to get back to the positive development we saw and the \"Safety beyond 2020\" project will continue to be our main initiative for improvement. Reducing Line of Fire incidents and enhanced collaboration with our suppliers will be prioritized.", "Personnel health and safety For 2019, the total recordable injury frequency per million hours worked (TRIF) ended at 2.5, which is an improvement from 2018. This is the lowest frequency we have seen, ", "but we must strive to be always safe and will increase our efforts going forward. In particular, the follow up of compliance with Life-Saving Rules will be strengthened. 
", "The last three years we have had a steady and significant improvement in the number of work-related illness cases (WRI). Despite of seeing an increase in WRI from 2018 to 2019, the number of WRIs\u2019 is still low for 2019. Psychosocial aspects are one of the key contributors to this development, along with noise and ergonomic conditions. The average score of our global annual survey relating to issues of psychosocial aspects developed positively in 2019. ", "The sickness absence rate for our Equinor ASA employees was 4.4% in 2019, down from 4.6% in 2018.", "Process safety We continued to see a reduction in the number of serious oil and gas leakages (with a leakage rate \u2265 0.1 kg per second) for the fourth consecutive year and our target of a maximum of ten leakages was reached. This is the lowest number since 2012.", "The number of oil spills per year decreased compared to last year. Close to 90% of the total number were spills with volumes less than a barrel. In 2019, we experienced a large and serious spill. Hurricane Dorian hit Grand Bahama Island and our South Riding Point terminal for storage and transshipment of oil and caused a spill of 8 744 m3. For further details see chapter on Emergency preparedness and response.", "No serious well control incidents were recorded in 2019.", "Total serious incident frequency (SIF) (KPI)", "Total recordable injury frequency (TRIF) (KPI)", "Serious oil and gas leakages - (KPI) (number per year)", " The incident caused by the Hurricane Dorian that hit Grand Bahama Island and our ", "South Riding Point terminal is being investigated and the final classification is not concluded. ", " The oil spill following Hurricane Dorian that hit Grand Bahama Island and our South Riding Point terminal accounts for 97% of the total volume. In December 2018 a HC-leakage occurred on Statfjord B. 
The investigation report, released in March 2019, classified the leak with an actual severity to be ", "included in the KPI, thus leading to a restated number of Oil and gas leakages for 2018.", "Equinor Sustainability report 2019Always safe - Responsible operationsEquinor Sustainability report 2019 Always safe - Responsible operations(million hours)Total serious incident frequencyTarget 2019Hours worked0.60.80.60.50.60.401002003004000123420152016201720182019(million hours)Total recordable injury frequencyTarget 2019Working hours2.72.7125.3128128.9123.71472.82.82.5(cubic metres)1,8003,6005,4007,2009,000(number per year)6012018024030020152016201720182019Number of spillsVolume of oil spills172146207238219316134138898321010203020152016201720182019Target 201918151210Oil and gas leakages"], "19": ["Business context and our approach Responsible management of our environmental impact is of great importance to Equinor. As a large offshore oil and gas operator and a growing offshore wind power provider, we have identified responsible management of the oceans as a sustainability priority area. ", "Significant environmental aspects of our offshore activities include discharges of produced and processed water to sea, management of drilling waste and potential effects on marine biodiversity (e.g. marine mammals, corals and birds). For our onshore processing plants and refineries in Norway and Denmark, SOx emissions and discharges of treated water to sea are significant environmental aspects. 
", "In our onshore US operations, significant environmental aspects are related to water sourcing and usage for the hydraulic fracturing process, robust well design and operational procedures to minimise impacts to the environment, and waste management for drill cuttings and produced and flowback water.", "Our environmental management approach, as described in the Equinor Book and internal policies, entails identification of significant impacts, collaborative research projects to build knowledge, environmental baseline studies, impact assessments and monitoring programmes. Our approach includes establishing measures tailored to local conditions and aimed at avoiding, minimising or mitigating any effects. We regularly assess our performance through reviews and assurance activities and set actions to improve when needed. Our environmental work is guided by our commitments to prevent harm to the environment, aim for outstanding natural resource efficiency and comply with all applicable environmental laws and regulations. ", "Our environmental performance indicators vary over time in line with variations in the operational activity level and type. Turnarounds, start-ups, the number of wells drilled, wells fractured and floatels used, and temporary operational irregularities are main factors influencing positive and negative changes in performance data. Our environmental performance is, even with these variations, considered to be in line with our aim to prevent harm to the environment. ", "More information on Impact assessments on equinor.com", "Our actions To manage our significant environmental aspects we have through 2019 focused on the areas below.", "Sustainable management of the oceans Our capabilities in sustainable ocean management have grown throughout our history of developing and operating offshore assets and our coexistence with other maritime actors. 
", "In 2018 we became one of the founding patrons of the UN Global Compact Action Platform for Sustainable Ocean Business. The platform is a three-year global programme that brings together business, civil society, the UN and governments to advance the ocean economy and sustainable development. In 2019, Equinor contributed to the development of the Ocean Opportunities Report and UN Global Compact Principles for Sustainable Ocean Business, launched in September 2019. Equinor has signed up to these nine principles.", "In support of combatting plastic pollution of the oceans we participate in an initiative together with the International Association of Oil and Gas Producers (IOGP), national and EU authorities for assessing the use, regulation, limitations and possible substitution of chemicals factually or potentially containing microplastic. Use of water-soluble products containing microplastic are not allowed in our operations, and we enforce strict restrictions on use of products containing microplastic in oil-based fluids, i.e. fluids not discharged to nature. We share the general concern related to plastic pollution of the ocean and continue the work to identify and substitute chemicals we use that contain microplastics.", "Water management and resource efficiency The majority of our offshore oil and gas platforms and onshore processing plants and refineries discharge produced and processed water to the sea. The objective of managing discharged water is to minimise volumes, uphold very low levels of dispersed hydrocarbons and use of chemicals, and replace chemicals with more environmentally friendly substitutes. The water is cleaned to the extent practically and technically possible, but small amounts of dispersed oil, natural components and chemicals are unavoidable contaminants. The oil-in-water content and chemical composition of water discharged to ", "sea is closely monitored to ensure it stays within regulatory limits. 
In some cases, especially during periods of varying process conditions, produced water is dispatched together with crude oil through pipelines to onshore plants for treatment. Improved work processes and an IT tool for water management have been implemented.", "In our US onshore shale operations, water sourcing and usage is accomplished through careful project planning and coordination with landowners, regulatory agencies and local water authorities and communities. The aim is to responsibly manage water throughout the life span of our activities. We aim to use only what is needed, so that impacts to surface and groundwater sources and disposal volumes are minimised. We continuously monitor water usage in our operations to optimise reduction efforts and assess water stress, where relevant. ", "Injection of CO2 along with water in well fracturing operations provides an opportunity to increase well production and reduce use of water. In 2019, several pilots using third-party CO\u2082 for hydraulic fracturing were safely executed at Bakken. Further applications of this new technology will be considered based on safety, logistics, and sustainability considerations, as well as project economics.", "We follow rigorous technical and operational standards for well design and operations, including standards for the types and volumes of chemicals used in drilling and hydraulic fracturing fluids. We disclose the chemicals used in hydraulic fracturing through FracFocus1.", "Drilling operations create large quantities of rock cuttings contaminated with drilling mud and fluids from the rock formations. These rock cuttings are in many offshore cases ground into a slurry and injected into subsurface formations for permanent storage. In other cases, rock cuttings are collected and transported to shore for cleaning and disposal or, in cases where water-based mud is used, discharged to sea. 
In many cases where oil-based drilling mud is used, transport of drill cuttings to shore for treatment and disposal is needed, requiring comprehensive logistical solutions and waste handling onshore. Thermomechanical cuttings cleaning (TCC), in which oil is removed from the drill cuttings through mechanical friction and heating, offers improved treatment of drill cuttings offshore and makes discharge of such cutting ", "1 The US national hydraulic fracturing chemical registry.", "material to sea environmentally acceptable. A TCC unit has been installed at the Johan Sverdrup field. Recent studies including effect studies of TCC-treated cuttings as seafloor deposits, confirm compliance with regulatory requirements and show no risk of adverse effects to the environment.", "Protecting biodiversity and eco-systems In line with increasing concerns about the global decline in biodiversity and ecosystems, Equinor has identified this environmental area as a priority area for review of our management approach and to identify improvement opportunities. Potential effects on biodiversity from our operations are mainly related to marine life in the Barents Sea and offshore the US east coast, birds in relation to wind farms offshore the UK and invasive corals at our offshore facilities in Brazil. ", "Barents Sea We have built knowledge of the marine environment and potential effects of our activities on marine life through baseline studies, impact assessments, monitoring programmes and research studies over decades. ", "In connection with the ongoing development of the Johan Castberg field, passive acoustic monitoring stations have been deployed in the project area to improve our understanding of the presence, abundance, diversity and migration of marine mammals in the south western area of the Barents Sea. The data will be used to inform future operational activities at the field. ", "Equinor was instrumental in the extension of the SEATRACK programme for the years 2019 -2022. 
SEATRACK aims to map the non-breeding distribution of seabirds in colonies encircling the Barents, Norwegian and North Seas, which includes colonies in Russia, Norway including Svalbard and Jan Mayen, Iceland, the Faroe Islands and Great Britain. SEATRACK is a collaboration between Norwegian authorities, research institutions and the oil and gas industry. MARAMBS, another collaborative research project, was finalised in 2019. It involved a modelling study providing high-resolution data for marine mammal and sea bird distribution in the Barents Sea.", "To further enhance our knowledge basis, we have participated in research projects like the E&P Sound & Marine Life Programme, studies of habitat preferences ", "Always safe - Responsible operations", "Always safe - Responsible operations"], "20": ["for polar bears, density modelling of whales and dolphins, distribution modelling of bird species and studies to increase our general knowledge on ice edge ecosystems. Offshore wind \u2013 UK and USA Equinor\u2019s Empire Wind offshore wind project, currently under development, has engaged in a pioneering partnership with conservation scientists to protect the endangered North Atlantic right whale. The collaboration with the Wildlife Conservation Society has deployed two high-tech whale monitoring equipment in the lease area. The real-time monitoring tool will be an effective way to detect large whale species during construction activities and will also provide scientists with significantly more spatial and temporal distribution data, which will be helpful to identify the best way to protect the species.", "The Dudgeon offshore wind farm is considered to be within the foraging range of Sandwich terns breeding in the North Norfolk Coast Special Protection Area. 
To provide a better understanding of the foraging behaviour of Sandwich terns and their interaction with Dudgeon and other nearby offshore wind farms, Equinor has undertaken an ornithological monitoring programme over four years.", "Brazil Biodiversity aspects are a focus area for our operations in Brazil and improvement initiatives have been undertaken in collaboration with the local chapter of the World Business ", "Council for Sustainable Development. In preparation for operations on the Carcar\u00e1 field, a comprehensive baseline study was conducted. The assessment included analysis of the sea water column and sediments, including organisms therein, in the Carcar\u00e1 area. We have also performed visual inspections of the seafloor in order to confirm the absence of deep-water corals or any other sensitive environment.", "A particular challenge is the invasive sun coral, which is currently spreading along the Brazilian coastline and competing with native coral species. To control the presence of this invasive species in the Peregrino field, a risk tool has been developed to assess the potential of vessels operating in the field spreading corals, so that relevant mitigating actions can be taken. ", "Australia As part of planning for the Stromlo-1 exploration drilling programme in the Great Australian Bight, a comprehensive Environmental Plan (EP) was finalised and submitted to the authorities in 2019. The EP, which took two years to develop, was accepted by the regulator in December 2019. The work included co-funding extensive baseline surveying of the deep-water environments and the met-ocean conditions of the Great Australian Bight. More information about the EP and related engagement activities is found in the Respecting human rights chapter in this report and on our web-site. ", "Our performance Emissions and discharges NOx emissions have decreased by 2% from 2018 to 2019, largely due to reduced drilling activities in the tight oil segment. 
SOx emissions increased by 22%, mainly caused by downtime of the sulphur treatment unit during a planned turnaround of the Mongstad refinery. Given the planned duration of the turnaround, the expected prompt return to regular conditions and the fact that these emissions cause no significant environmental impact, it was decided to continue operations for the upstream unit throughout the turnaround. Mitigating actions were implemented to reduce throughput for the plants giving sulphur contributions. The SOx emissions have been within the permit level. The experience from this turnaround is taken into account for planning of shutdowns in the future. Regular discharges of oil to water increased by 9% since 2018, mostly due to higher volume of produced water from wells. Emissions of non-volatile organic compounds were reduced by 13%, mainly as a result of a decrease in oil loading volumes on the Norwegian continental shelf.", "Waste and fracking chemicals Hazardous waste quantities increased by 30% from 2018 to 2019, as large process water volumes from the Troll field were dispatched through pipelines to shore and shipped to external contractors as waste, instead of being remediated at our own facilities. Non-hazardous waste quantities increased by 29% mainly due to large volumes of polluted soil from ground work and tank cleaning at the Kalundborg refinery.", "The volume of drill cuttings from US onshore operations, classified as exempt waste, increased by 53% in 2019. The increase is mainly due to cuttings being transported as waste to landfill sites rather than collected in on-site disposal pits. Management of such waste varies with location and landowner preferences and causes year to year variations in solid exempt waste. The disposal of liquid exempt waste has increased by 17% since 2018 due to higher amount of produced water from wells. 
Use of fracking chemicals has decreased by 15% due to reduced fracking activity at Bakken and Eagle Ford in 2019.", "Always safe - Responsible operations", "Always safe - Responsible operations", "Equinor Sustainability report 2019 Always safe - Responsible operationsEquinor Sustainability report 2019 Always safe - Responsible operations0.511.522.533.5201520162017201820190Sulphur Oxides (SOx)(thousand tonnes)2.51.81.71.82.2Regular discharges of oil to water(thousand tonnes)00.20.40.60.811.21.41.6201520162017201820191.41.41.21.11.2"], "21": ["Water Most of Equinor\u2019s operations are offshore or in areas of abundant water availability. For our onshore US operations, the main part of the Eagle Ford asset, which Equinor divested from in 2019, and a smaller part of the Bakken asset were for 2018 reported to be within a high or extremely high baseline water stress area. However, the latest version of the Aqueduct tool (owned by World Resources Institute) for which the hydrology model and other parameters were updated during 2019, shows that none of our operations are in areas of high or extremely high water stress. The consumption of freshwater has decreased by 8% due to reduced fracking activity at Bakken and Eagle Ford in 2019.", "Protected areas and areas of high biodiversity value Equinor is concerned with valuing and protecting biodiversity and the ecosystem. Equinor is an active participant in a joint Biodiversity and Ecosystem Services Working Group of IPIECA and IOGP. This cooperation has resulted in the development of specific tools and recommendations for industry best practice. We also support the maintenance and development of the World Database on Protected Areas. These databases are used actively in environmental risk and impact evaluations. An overview of the number of operational assets, and licenses with exploration activities which are located inside of or close to protected areas, can be seen below. 
Equinor did not have operations in protected areas in 2019.", "Operating sites in and around protected areas and areas of high biodiversity value in 2019 (Equinor operated).", "In the vicinity (5 \u2013 20 km)3 - of protected areas - of areas high biodiversity value ", "Close (1 \u2013 5 km)3 - to protected areas - to areas of high biodiversity value ", "Adjacent (< 1 km) - to protected areas4 - to areas of high biodiversity value ", "Inside - protected areas - areas of high biodiversity value ", "1) Assets means installations and plants in operation or under construction 2) Licenses includes only those licenses where there have been operational activities other than 1) above, e.g. seismic 3) For assets and licenses further away from protected areas and areas of high biodiversity value there should be no interaction during normal operations. Potential interactions with designating features of the protected areas are addressed during EIA processes and relevant monitoring plans are put in place 4) All assets adjacent to protected areas, except one, are subsea pipelines while the protected areas are located on islands. The last asset, Kalundborg refinery, is located next to an IUCN category IV protected area. Under normal operations there is no ", "interaction between the protected areas and these assets. ", "Acid gases and non-methane volatile organic compounds", "Non-methane volatile organic compounds (nmVOC)", "Exempt waste generated: cuttings and solids [1]", "Exempt waste generated: produced water and flowback [1]", "Share of production in areas of high water stress [5]", "OC = Operational control. NR = Not reported.", "These are therefore not included in the hazardous or non-hazardous waste and waste recovery figures. 
In 2016 a change was made in the categorisation of recovered waste, allowing for the inclusion of treated oil contaminated water.", "[1] Drill cuttings, and produced and flow-back water from our US onshore operations are exempt from regulation as hazardous waste. [2] [3] Related to our US Onshore operations. [4] Total freshwater withdrawal is for Equinor activities equal to total freshwater consumption, since no water is returned to source. [5] The hydrological model in the Aqueduct tool was updated in 2019. This change had as impact that the water stress categorisation (a) Historical figures have been updated to correct an unintended systematic over-reporting of the freshwater withdrawal in the tight oil segment.", "of our Eagle Ford and Bakken assets is now at levels below high and extremely high baseline water stress.", "Always safe - Responsible operations", "Always safe - Responsible operations", "Equinor Sustainability report 2019 Always safe - Responsible operationsEquinor Sustainability report 2019 Always safe - Responsible operations"], "22": ["Business context and our approach The safety of our employees and others affected by our operations, including workers of our contractors, is at the heart of our business. Our strategic commitment to always safe also translates into an expectation to respect internationally recognised human rights of people affected by our operations. ", "In our human rights policy, created in 2015, we have committed to conduct our business consistent with the United Nations Guiding Principles on Business and Human Rights, the ten principles of the Global Compact and the Voluntary Principles on Business and Human Rights. The policy addresses the most relevant human rights issues pertaining to our operations and role as an employer, business partner, buyer, and to our presence in local communities. 
These issues include a commitment to provide a safe, healthy and secure working environment, and to treat employees and those impacted by our operations fairly and without discrimination. More information on how we work with these topics in relation to our own employees can be found in the sections regarding people and safety in this report. Our specific efforts to prevent modern slavery in our operations and value chains are described in our annual UK Modern Slavery Statement, available online. Our actions Human rights review As part of Equinor\u2019s integrated approach to the management of sustainability performance, progress of the human rights policy implementation was assessed. As a result, a human rights improvement project was established with the aim of strengthening processes and capabilities in our company, supported by a corporate-level action for 2019. Additional developments include the creation of a new position, Vice President of Human Rights, and the reorganisation of the Human Rights Steering Committee to be attended by select members of the corporate executive committee. More information about the governance of human rights within Equinor can be found on our webpages. ", "Human rights risk assessments In 2019, we implemented the human rights risk assessment methodology, allowing risk to people\u2019s human rights to be reported for the first time through our risk management system. By including these risks in our management system, our processes now require human rights risks of a certain ", "We must work systematically to integrate human rights in our normal way of doing business", "severity level to be reported to the organisation levels above, including to the CEO and the Board of Directors. The identified potential impacts related to Equinor\u2019s business covered 11 separate categories of rights, categorised by employees, workers in the supply chain and local communities. 
", "This process has been supported by significant training and awareness sessions, and as a result we have seen improvements in the quality and depth of reporting between the two periods. We believe this risk identification process will support more effective approaches to mitigation and remediation going forward.", "Awareness raising and training At Equinor we believe that a rights-respecting culture can only be achieved if it is led from the top, which is exemplified by our CEO\u2019s keynote speech at the fifth annual Thorolf Rafto Challenge at the Norwegian School of Economics in Bergen. A transcript of his speech is available online.", "During 2019, we continued our efforts towards awareness and training on human rights across the company. The senior leadership team continued to develop their approach to human rights throughout 2019, discussing the topic for more than six hours in the corporate executive committee meetings. In addition, our human rights efforts were discussed and evaluated in two meetings by the Board of Directors Safety, Sustainability and Ethics Committee and once with the full Board of Directors. Every business area management committee and most functional management teams have conducted targeted awareness sessions at least once. ", "In 2019, we continued to hold training sessions with select groups, focusing on identifying and managing human rights risks and impacts from our activities and throughout our supply chain. This year, more than 400 employees were trained through a full-day classroom course on Supply Chain Management Ethics, anti-corruption and human rights. This included all safety and sustainability leaders in the business area Technology, Projects and Drilling; the procurement teams in, amongst others, Brazil and Nicaragua; and for personnel involved in supply chain activities at Krst, Norway. Furthermore, personnel from select suppliers in Brazil joined a two-hour training session on human rights in the supply chain. 
Additionally, Shift Project has delivered a full-day training with over 30 representatives from the Legal function. In total, over 500 employees attended classroom-based targeted training sessions.", "We see from post-course feedback that attendees consider these training sessions to increase specific awareness of human rights issues related to their work, leading to changed behaviours when assessing risks, following up on issues, and ensuring that human rights is included when scoping work. ", "Our e-learning program on human rights has been revisited and is now made available in three languages. We have also created a stand-alone human rights page on our external website, with our human rights policy translated into seven languages relevant to our business activities.", "Engagement and grievance mechanisms Engaging with potentially affected stakeholders is imperative to inform our operations and business plans. Grievance mechanisms form an important part of our stakeholder engagement process. Our human rights policy states that we will provide or cooperate in providing appropriate remediation if we have caused or contributed to adverse human rights impacts. In addition, Equinor has an ethics helpline available to all our employees and third parties who want to communicate concerns. Our operational-level grievance mechanisms cover our activities in Brazil, Tanzania and our Empire Wind operations in the USA. In addition, all seismic surveys and our renewable projects are covered by operational- level grievance mechanisms. During 2019 there were no concerns raised through our operational-level grievance ", "Equinor Sustainability report 2019 Always safe - Responsible operationsEquinor Sustainability report 2019 Always safe - Responsible operations"], "23": ["mechanisms, and none of our business activities involved involuntary resettlement or relocation of people. 
", "Australia As part of our consultation with affected people in 2019, we published a 1,500-page Environmental Plan (EP) for the Stromlo-1 Exploration Drilling Program in the Great Australian Bight. The process included extensive engagement with stakeholders, supported by an EP in Brief to help the community interpret the technical document. We held a series of drop in sessions and published a Statement of Response to Public Comment on our website, creating transparency toward the improvements made to our EP in response to stakeholder submissions. This process allowed us to include public interest updates to the EP when resubmitting to the Australian regulators in September 2019. ", "Brazil As a major offshore operator, it is particularly relevant for Equinor to keep close engagement with fisheries. Fishermen operating offshore Brazil are impacted by our offshore activities through the regulatory prohibition on fishing near offshore installations. During 2019, Equinor and partners were responsible for training approximately 300 local fishermen to act as response teams in the event of an oil spill at sea, with the purpose of ensuring the safety and protection of marine and coastal environments. The process has resulted in formal certifications for the fishermen and their vessels, creating positive safety results and expanded livelihood opportunities for the fishing communities. ", "UK Similarly, engagement has been important for the Dogger Bank Offshore Wind Farms project, where fisheries were identified as potentially affected stakeholders both during construction and operations. Through regular collaborative engagement, a draft Fisheries Liaison Plan including a proposed grievance mechanism for fishing gear damage has been proposed. The plan has been shared with relevant stakeholders for feedback and will be published once received by regulators. ", "We recognise that our efforts in this space is a continuous journey of improvement. 
As such, the human rights improvement project conducted an analysis during 2019 to explore how we can ensure ongoing improvement of identification and engagement with potentially affected stakeholders, paying attention to our activities in, amongst others, Argentina, Nicaragua and Mexico.", "Human rights in the supply chain The supply chain continues to be an important focus area for our human rights efforts in Equinor. ", "This year, Equinor\u2019s Human Rights Expectations to Suppliers were launched and there will be supported by a guidance document providing practical advice for how to live up to these expectations. These efforts continued alongside our onsite assessments with more than 50 suppliers across 16 countries. The assessments have enabled us to identify gaps and areas of improvement in collaboration with our suppliers to ensure that potential harm to people is reduced or eliminated. ", "During 2019, we piloted a new way of identifying potential negative impacts on workers\u2019 human rights related to supplier conduct, moving from company-focused audits to worker dialogue-focused reviews, enhancing our risk identification abilities and granularity. In 2019, we continued this work and performed renewed engagement with workers to help us understand if the implemented actions improved their lives. This renewed engagement confirmed that the efforts taken by our supplier had resulted in return of passports, tighter control of working hours and a strengthened recruitment due diligence process which has significantly reduced worker paid recruitment fees for newly recruited workers compared to 2018. In this case, we believe that this continued engagement is an effective way of measuring results. ", "Building on the learnings from this pilot, we initiated another supplier engagement programme following the same approach. 
Here, we have seen positive outcomes for workers through the discontinued practice of retention of worker ID documents, improved conditions in accommodation and sanitation areas, and discontinued fees for work mistakes. The positive steps from these two cases would not have been possible without the close collaboration with our direct suppliers, who have also updated their own internal procedures and allocated staff to develop their own practice in this area. This will be supplemented by the adoption of the Employer Pays principle for all new direct and indirect hires from 01 January 2020 by this supplier, as well as through ongoing due diligence of manning agencies in source countries, where this principle will be updated into agency agreements. ", "Following the agreement of peer collaboration on human rights supplier assessments in 2018, a platform for sharing and viewing of assessments has been developed and will be launched in 2020. This industry-first initiative will drive collaboration in the follow up process towards energy company suppliers. ", "In 2019, we focused our efforts towards targeted groups and areas, to further improve the effectiveness of our actions. We experienced increased openness to address risks and dilemmas, more active engagement and reflection around company values, and demand for more training to tackle challenges. We consider all these behaviours to be indicators of improvements in embedding a rights-respecting culture.", "Findings - human rights verifications 2019 Findings from human rights assessments 2019", "In our supply chain work, we focused more deeply on mitigation, and saw specific actions being defined and progressed based on our targeted worker-based reviews. Until meaningful leading and performance indicator are created, our progress and performance will be assessed on anecdotal evidence. ", "Through human rights supplier verifications we identified gaps both with regards to management system and implementation. 
We pay particular attention to findings that are considered potential markers of modern-day slavery and collaborate with the suppliers to improve and close the gaps. ", "Employee training (internal learning) ", "Class room course training days per employee", "E-learning participations per employee", "Labour rights and working conditions in the supply chain", "Supplier human rights (HR) verifications conducted", "Countries in which supplier HR verifications undertaken", "Employees working with our suppliers trained (class room course)", "Equinor Sustainability report 2019 Always safe - Responsible operationsEquinor Sustainability report 2019 Always safe - Responsible operations7455465877161159Management systemWagesWorking hoursMinimum age of labourRecruitmentNon discriminationFreedom of associationStandards own suppliersEmployment terms"], "24": ["Our performance The number of cases received through the Ethics Helpline was 194 in 2019, an increase from 182 in 2018. The cases received included 62 reported concerns relating to harassment, discrimination and other conduct affecting the working environment. We experienced a decrease in the number of cases related to our suppliers. ", "In our opinion the Ethics Helpline reporting works well. Based on a review of the reported concerns and the number of reports received through the Ethics Helpline in 2019, we do not see any immediate need for an adjustment to the management approach. However, we work continuously with improving our processes. ", "Promoting integrity and transparency", "Business context and our approach Equinor is a global company with a presence in parts of the world where corruption represents a high risk. With a strategy to accelerate internationalisation and increase investments in new energy markets, 2019 represented a year of continued focus on ethics and anti-corruption. ", "Equinor is committed to conduct our business in an ethical, socially responsible and transparent manner. 
We maintain an open dialogue on ethical issues, both internally and externally. ", "Code of Conduct - The Code of Conduct sets out our commitment and requirements for how we work at Equinor. It applies to employees, Equinor board members and hired contractors. We train our employees on how to apply the Code of Conduct in their work. All Equinor employees are required to confirm annually that they understand and will comply with the Code of Conduct. We expect our suppliers to act in a way that is consistent with our Code of Conduct. We engage with our suppliers to help them understand our ethical requirements and how we do business. If the expectations are not met, we take appropriate actions.", "Anti-bribery and corruption - Our Code of Conduct explicitly prohibits engaging in bribery and corruption in any form. Equinor\u2019s Anti-Corruption Compliance Program summarises the standards, requirements and procedures implemented to comply with applicable laws and regulations and maintaining our high ethical standards. Our group-wide policy ensures that anti-bribery and corruption risks are identified, and measures are taken to mitigate risk in all parts of the organisation and that concerns are reported. We maintain a global network of compliance officers responsible for ensuring that ethical and anti- corruption considerations are integrated into Equinor activities no matter where they take place. ", "to discuss concerns with their leader or the leader\u2019s superior or use available internal channels to provide support. Concerns may also be reported through our Ethics Helpline. The helpline allows for anonymous reporting and is open to employees, business partners and the general public. Equinor has a strict non-retaliation policy.", "Tax transparency and payments to governments reporting - We believe that through disclosure of payments to governments we promote accountability and build trust in the societies where we operate. 
We have reported our payments to governments on a country-by-country basis for more than a decade. Since 2014, we have reported such payments on a project-by-project and legal entities basis, in our Annual Report and Form 20F. This reporting represents a core element of transparent corporate tax disclosure. Since 2018, we have published our global tax strategy, available online. These disclosures are in line with our commitment to conduct our business activities in a transparent way. ", "Equinor provides regular training across the organisation to build awareness and understanding of the Anti-Corruption Compliance Program. Our in-person workshops are designed to facilitate meaningful in-depth discussion on specific issues tailored to the nature or location of their role. ", "Reporting and handling of concerns \u2013 The Code of Conduct imposes a duty to report possible violations of the Code or other unethical conduct. We require leaders to take their control responsibilities seriously to prevent, detect and respond to ethical issues. Employees are encouraged ", "Our actions Anti-bribery and corruption compliance - Our ethics and anti-corruption training efforts during 2019 included both general and targeted training sessions through a combination of e-learning and workshops. In 2019, we had particular focus on integrating money laundering into to our anti-corruption workshops to increase awareness of money laundering risk within the organisation. ", "In 2019, we increased the number of targeted tailored ", "trainings to employees appropriate to the nature or location of their role.", "During 2019, we had a companywide Code of Conduct campaign focusing on the main provisions of the Code. The responsibility for reporting concerns was a part of this campaign. In addition, communication of the Ethics Helpline was included in the company\u2019s security month, in our training sessions and in Ethics Committees. 
", "Working with suppliers and partners \u2013 During 2019 we continued our interaction with suppliers and partners on ethics and anti-corruption regarding the risks that we jointly face and actions that can be taken to address them. We proceeded our sustainability and compliance sessions with events in Russia and Azerbaijan, meeting with partners and suppliers discussing common efforts to strengthen compliance programs. Risk-based verifications of selected suppliers were carried out. To strengthen our management of third-party corruption risk in non-operated joint ventures we focused in 2019 on targeted training of Equinor\u2019s dedicated asset teams and management. ", "Collaboration and stakeholder engagement - Equinor believes in the value of collective action to actively promote anti-corruption and transparency. We have long standing relationships with the UN Global Compact, the World Economic Forum\u2019s Partnering Against Corruption Initiative (PACI) and Transparency International (TI). ", "Equinor has been a supporter of the Extractive Industries Transparency Initiative (EITI) for many years, through board and committee representation and active participation in working groups. An Equinor representative is elected member of the EITI international board. Through this work we exchange knowledge and demonstrate our continued commitment to contribute to improved governance and greater transparency in the extractive sector. In 2019, we were present in ten EITI-implementing countries. We provided USD 60,000 in regular annual financial support to the international EITI. 
In addition, Equinor contributed USD 25.000 in support of the EITI Global Conference hosted by the French Government as part of the French presidency of the G7.", "Equinor Sustainability report 2019 Always safe - Responsible operationsEquinor Sustainability report 2019 Always safe - Responsible operations621153282515People and workplaceSafety and securityEnvironment and communitiesPartners and supply chainAsset and business integrityTests, questions and other"], "25": ["During 2019, we have engaged with local industries and suppliers to support major project developments in core areas.", "US This year Equinor\u2019s Empire Wind project successfully bid in the United States\u2019 first large- scale competitive offshore wind solicitation. Our winning bid represents an important milestone for Equinor\u2019s ambition to build an offshore wind core area on the US East Coast. The 816-megawatt (MW) offshore wind project will bring renewable energy to New York consumers, contribute to the state\u2019s ambitious renewable energy development goals, and provide significant economic benefits to New York. The project is expected to be developed with 60-80 wind turbines, with an installed capacity of more than 10 MW each. Total investments will be approximately USD 3 billion, and the project will be able to power over 500,000 homes in New York, with an expected start-up in late 2024.", "Norway This year Equinor and the Johan Sverdrup partnership consisting of Lundin Norway, Petoro, Aker BP and Total, started production from the giant field in the North Sea. Johan Sverdrup has expected recoverable reserves of 2.7 billion barrels of oil equivalents and the full field can produce up to 660,000 barrels of oil per day at peak. In the operational phase, an average year will generate around 2,700 man-years, and during the full field development 3,400 man-years of work opportunities will be generated. 
The Norwegian supply industry may receive more than 50% of the assignments during the construction phase, and around 90% in the operational phase.", "This year Equinor also signed contracts for the Hywind Tampen wind farm development. This project will contribute to further developing floating offshore wind technology and reducing the costs of future floating offshore wind farms, offering new industrial opportunities for Norway, the licenses and the Norwegian supplier industry in a growing global offshore wind market.", "UK The Equinor operated offshore wind farms Sheringham Shoal, Dudgeon and Hywind Scotland are supporting local communities through community funds or local educational initiatives and sponsorships.", "The Mariner project supports around 700 long term jobs and between 80-90% of the contracts for offshore work during the production phase were awarded to UK-based suppliers. The project will create ripple effects in the local supply chain for the next 30 years of production. In the UK, Equinor works closely with the local supply chain and peers, focusing on collaboration and digitalisation to improve industry performance. ", "Brazil Equinor\u2019s social investment and sponsorship portfolio in Brazil has been reviewed based on four main objectives: (i) build long-term capability for the market through education; (ii) create opportunities for local communities, contributing to a reduction in social inequality; (iii) engage the entire Equinor Brazil organisation and build internal pride, (iv) improve brand recognition and enhance Equinor\u2019s reputation in the local market. ", "Equinor Brazil has approved a new social investment initiative which is inspired and guided by the UN\u2019s ", "Sustainable Development Goals (SDGs), and our commitment to long-term sustainable value creation is in line with the principles of the SDGs. 
The main focus of the initiative is SDG 4 \u2013 Quality in education, with a goal to ensure inclusive and equitable education and promote lifelong learning for all. ", "Our Brazilian offshore operations impact fishermen due to a prohibition on fishing within safety zones around offshore installations. Since 2017 Equinor Brazil together with Shell have been running the Mar Atento project, a pilot ", "project in collaboration with local fishermen, providing oil spill response training. Through this engagement we strengthened our relationship with fishermen and their communities and developed a register of trained fishermen, ready to provide emergency response support. ", "In 2019, Equinor announced a new partnership with the Aberdeen Science Centre focusing on digitalisation and new technology. Equinor continues its support for NASA in Aberdeen and TechFest. In 2019, participation in the joint Heroes of Tomorrow event with TechFest was doubled to over 400 young people. ", "In 2019, the project was expanded to six municipalities on the Brazilian coast, with around 300 additional fishermen trained. The project is open for further expansion, to involve more oil operators as future partners. ", "Equinor Sustainability report 2019High value \u2014 creating shared valueEquinor Sustainability report 2019 High value \u2014 creating shared value"], "26": ["Creating shared value is one of the three key sustainability priorities that guides Equinor. Our management approach to shared value is described in the Equinor Book and internal policies. We aim to contribute to the development of communities where we have long-term operations. Together with our stakeholders and partners, we work to find mutual benefits and lasting solutions to common challenges and engage in dialogue with local communities to explain our actions and manage expectations. 
We assess the impact and outcome of our activities through received feedback, reviews and assurance activities, and set actions to improve when needed.", "We create shared value that contributes to sustainable development through:", "\u2022 Providing access to affordable, reliable, sustainable and modern energy \u2022 Creating value for shareholders \u2022 \u2022 Hiring and developing staff, and promotion of diversity and inclusion in our workforce \u2022 Creating opportunities for social and economic development across our value chain through payments to governments, ", "Innovation, research and development activities", "local job creation and local sourcing of goods and services", "\u2022 Purchasing goods and services \u2022 Management of social impacts and outcomes, and contributing to ripple effects ", "Economic value creation and distribution", "Social investments sponsorships & donations", "Equinor operates primarily in OECD countries. Hence, our economic contributions to society are primarily in the form of taxes and other payments to governments, purchases of goods and services, wages and employee benefits and dividends to shareholders, rather than social investments. ", "Creating shared value with communities Equinor\u2019s transition to a global energy company requires systematic development of competence and access to new talent. We empower our people to execute on business ambitions, while promoting personal growth and development. Through learning and development activities we prepare for increased digitalisation and new ways of working. As part of our long-term commitment to creating shared value, Equinor emphasises building skills and capacity in the communities where we have activities. A large portion of our sponsorships, donations and social investments is allocated to capacity building within science, technology, engineering and mathematics (STEM), through partnerships with academic institutions and support to science centres. 
Our academia collaboration with key universities increasingly addresses the energy transition and new energy solutions. Through our Heroes of Tomorrow programme, we give children and youth the opportunity to develop their talents within the areas of sports, culture and education. In 2019, our corporate sponsorships spend was USD 19.2 million.", "Teach First Norway is a two-year development programme for newly-educated talents holding a science degree. The programme was established 10 years ago as a partnership between the Oslo Education Agency, the University of Oslo and Equinor. Teach First Norway is working with talented M.Sc. graduates to become effective and inspiring teachers and leaders. Teach First candidates teach STEM subjects at selected schools in Oslo. At the same time, they receive formal teaching education (PPU) and leadership training. ", "We also create value for society through research, development and innovation. In 2019, our R&D expenditure was USD 300 million. Examples of how we collaborate with others to find new and innovative solutions are provided throughout the report. ", "Equinor Technology Ventures Equinor Technology Ventures supports small and medium enterprises (SMEs) with exciting new technologies in oil and energy\u2014and in turn, helps Equinor be the world\u2019s most carbon-efficient oil and gas producer with a developing renewable business. ", "Equinor Innovate Equinor Innovate is our dedicated channel to challenge- driven open innovation. We focus on connecting with institutions and companies that can help us find solutions to concrete business challenges. Ideas and solutions to improve and expand our business along three main opportunity areas, are especially welcome. Our three ", "opportunity areas are: Competitive at all times, Transforming the oil and gas industry, and Providing energy for a low carbon future. ", "Digitalisation Equinor\u2019s digital roadmap is progressing well. 
New digital technologies are implemented to help us reach our goals of improved safety performance, reduced emissions and higher value. The integrated operations support centre, established in 2018, will be central in reducing CO\u2082 emissions from the NCS. Equinor has so far connected 20 of its assets to this centre, streaming data to our cloud-based data platform. By end of 2020 all operated fields on the NCS will be connected. Cross-functional teams utilise this data to discover opportunities for energy efficiency measures, safety and value improvements. Another centre, the geo-operations centre, ensures more efficient and better geoscience control of drilling operations, as well as cost savings and improved personnel safety. Further, subsurface data are connected and analysed in new ways through our subsurface data lake, enhancing the reservoir performance. Our digital field worker concept is also being broadly implemented, allowing our operators and engineers easy access to data enabling improved safety performance, higher efficiency and reduced carbon footprint. Workforce diversity and inclusion Embracing diversity and driving inclusion is a fundamental part of our values - open, collaborative, courageous and caring - and an integral part of our leadership expectations. This includes working actively to ensure that everyone has equal opportunities at Equinor. In 2019, we continued to strengthen diversity and inclusion in Equinor by embedding it into our key human resources processes, such as recruitment, succession planning, performance management and leadership development. We monitor diversity in our workforce at all levels and locations and encourage and support employee initiatives that contribute to a diverse and inclusive culture. In 2019, we established guidelines to further support employee resource groups in Equinor, including Women in Equinor, Differently Abled and LGBTQ+ groups. 
", "Diversity to us includes age, gender, nationality, experience, competence, education, cultural background, religion, ethnicity, sexual orientation and disabilities \u2013 everything that helps shape our thoughts and perspectives. Inclusion to us means that everyone in Equinor feel like that they are part of one team, are able to bring their whole self to work, and have their voices heard to perform at their best. We believe we can only leverage the value of diversity if ", "Equinor Sustainability report 2019 High value \u2014 creating shared value"], "27": ["we have an inclusive culture where everyone feel safe to contribute.", "support our agenda on diversity and inclusion and our general attractiveness as an employer.", "In 2019, Equinor implemented a corporate diversity and inclusion (D&I) KPI, which is measured at the team level. The KPI is based on a diversity index and an inclusion index. Our diversity index is flexible and holistic, meaning teams may focus on different dimensions of diversity to achieve the balance that adds most value to them. The diversity KPI monitors each business area\u2019s progression on team diversity. The Inclusion Index is measured in our Global People Survey, and measures employees\u2019 perception of inclusion in their teams. Our ambition is for all teams in Equinor to be diverse and inclusive by 2025. ", "To show our commitment to equal and inclusive workplaces, Equinor participated in several Gender Equality Indexes that aim to give more visibility into reporting on environmental, social and governance (ESG) from public companies. In 2019, we submitted our employees\u2019 gender profile for inclusion in the Bloomberg Gender-Equality Index, and the Norwegian SHE Index where Equinor was ranked number 10 out of 91 of Norway\u2019s largest companies.", "We continuously work on mitigating unconscious biases. 
During 2019, classroom and online training on unconscious bias was delivered across the organisation, including all top-level leadership teams and our external recruitment providers. We will continue to deliver training on this important topic in 2020. ", "In all our leadership activities, including talent and succession reviews, leadership assessments, leadership development courses and top-tier leadership deployment, we aim for gender balance and diversity. As a part of this, we pay close attention to positions and discipline areas dominated by employees of one gender. In 2019, both shares of female leaders at different levels as well as leaders with non-Norwegian background have increased and this indicates that our management approach related to diversity is contributing to improved diversity.", "Consistent with our values and to strengthen our brand and attractiveness as an employer, we successfully implemented a global parental leave policy in all Equinor companies and health insurance in Equinor ASA effective from January 2019. A minimum of 16 weeks paid leave is offered to all employees in the group becoming parents through birth or adoption. The health insurance scheme, supplementing public health services, offers access to private specialists, medical examinations and treatments, and is similar to local health insurance already provided in our subsidiaries. We expect the scheme to have a positive effect on employees\u2019 health and believe that both benefits ", "Developing our people As Equinor develops into a broad energy company and accelerates the use of digital solutions, our ability to drive people development is critical to the delivery of our business strategy. Building a culture of lifelong learning where our employees develop new skills faster to match changing job requirements, has been a key focus area in 2019. We continue to use deployment across the company as a strong tool for driving on-the-job learning. 
Through all the academies in The Equinor University we intensified our formal learning activities, particularly relating to safety and digitalisation. In 2019, we more than tripled our learning activities in digital topics, including the introduction of \u2018Digital Leadership\u2019 training for our leaders. In addition, we significantly increased learning activities across the company, using e-learning and virtual classrooms as a flexible, accessible and cost-effective means to increase participation. ", "Early Talents We continue to invest in our early talents through our graduate and apprentice programmes. In 2019, we welcomed 182 graduates and 157 apprentices. Through our recruitment and attraction activities we strive to increase the diversity of our early talent applicant base and hires, and our ambition was to achieve a 50-50 balance on gender and non-Norwegian background in 2019. In 2019, we made strides towards achieving this goal with a 43-57 split between female and male graduates recruited, and a 45-55 split between graduates recruited with a non- Norwegian and Norwegian background.", "Employee relations We believe in involving our people in the development of the company. In all countries where we are present, we involve our employees and/or their appropriate representatives according to local laws and practices. This varies from formal bodies with employee representatives to employee engagement and involvement through team or town hall meetings. ", "In 2019, we maintained close cooperation with employee representatives through formal and informal dialogue, at relevant levels and areas of the business. In our European Works Council, we discussed matters, such as Equinors strategy, human rights, safety, digitalisation, GDPR and future ways of working. In May 2019, we renewed our union agreement in Brazil, covering our onshore and offshore workers, and included an amendment covering specific regulations for offshore workers. 
Data on union membership figures is available in our sustainability performance data at Equinor.com.", "In our opinion the updated strategy for inclusion and diversity, makes the organisation more resilient for the future. We therefore do not see any need for an adjustment to the management approach. ", " Economic value created and distributed ", " Employment, recruitment and workforce diversity", "Total number of permanent employees", "Total number of permanent employees in non-OECD countries", "Permanent employees female (share of total)", "More data is available in our sustainability performance data and in our Payments to governments report, at Equinor.com.", "Corporate executive committee, business areas and business clusters Business unit leadersBusiness sector leadersBusiness department leadersProportion of women in leadership positions (percentage)020406020192018201720162015"], "28": ["Actual serious incident frequency (SIF)", "The number of serious incidents (per million hours worked). An incident is an event or chain of events that has caused or could have caused injury, illness and/or damage to/loss of property, the environment or a third party. All undesirable incidents are categorised according to the degree of seriousness, based on established categorisation matrices.", "Comprises Key biodiversity areas included in the World Database on Key Biodiversity Areas managed by International Union for Conservation of Nature (IUCN) and Particularly Valuable and Sensitive Areas (Srlig verdifulle og srbare omrder) on the Norwegian Continental Shelf.", "Board of Directors\u2019 Safety, Sustainability and Ethics committee.", "CO\u2082 released to the atmosphere as a result of our processes and activities, including CO\u2082 emissions from energy generation, heat production, flaring (including well testing/well work-over), and remaining emissions from carbon capture and treatment plants. 
Separate data compiled for Equinor operated activities and equity basis.", "Carbon dioxide equivalent is a quantity that describes, for a given mixture and amount of greenhouse gas, the amount of CO2 that would have the same global warming potential. ", "CDP is a not-for-profit charity that runs a global disclosure system for investors, companies, cities, states and regions to report and benchmark their environmental impacts.", "Includes cash dividend and scrip dividend.", "Extractives Industries Transparency Initiative. ", "Salaries, pensions, payroll tax and other compensations.", "European Union Emissions Trading System.", "The US national hydraulic fracturing chemical registry.", "Energy used for power generation and heat production in combustion processes, unused energy from flaring (including well testing/work-over and venting), energy sold/delivered to third parties and gross energy (heat and electricity) purchased.", "Naturally occurring water with a low concentration of salts, or generally accepted as suitable for abstraction and treatment to produce potable water. Includes water from public installations, wells (including groundwater reservoirs), lakes, streams, rivers and purchased fresh water. Fresh water produced from salt water on facilities/installations is not included.", "General Data Protection Regulation", "For Equinor, the relevant GHGs are CO\u2082 and methane (CH4). Other GHGs are not included as they are assessed to be non- material for Equinor. Equinor uses a global warming potential that is 25 times higher than CO\u2082 in a 100-year perspective for methane, aligned with industry reporting practice. 
", "Waste is considered to be hazardous waste according to the regulations under which the activity operates or where the waste can pose a substantial hazard to human health and/or the environment when improperly managed.", "The total quantity of CO\u2082 injected into the subsurface for the purpose of storage or improved/enhanced oil recovery.", "The International association of Oil & Gas Producers. ", "The global oil and gas industry association for environmental and social issues. ", "Equinor Sustainability report 2019AppendicesEquinor Sustainability report 2019 Appendices"], "29": ["Low carbon and energy efficiency R&D expenditure", "The share of annual research expenditures, in percentages of total R&D expenditures, used on new energy solutions and energy efficiency technologies, including energy efficiency as secondary effect.", "The monetary charge or payment imposed on a Equinor entity for failure to comply with safety and environmental laws and regulations. Only fines paid by Equinor as an operator are included. Fines are reported for the financial year when the actual payment is made.", "CH4 released to the atmosphere including emissions from energy generation and heat production at own plants, flaring (including well testing/well work-over), cold venting, diffuse emissions, and the storage and loading of crude oil.", "Direct GHG emissions from operations that are owned and/or controlled by the organisation. ", "Total methane emissions from our up- and midstream activities divided by the marketed gas, both on a 100 % operated basis.", "GHG emissions associated with the production and use of energy produced by Equinor, including negative emissions related to carbon services and offsets, divided by the amount of energy produced by the company (gCO\u2082e/MJ). 
A detailed description of the net carbon intensity indicator is available at Equinor.com.", "Indirect GHG emissions from energy imported from third parties, heating, cooling, and steam consumed within the organisation. We use IEA (physical) and RE-DISS (market-based) as sources of scope 2 emissions factor, expressed as kg CO\u2082/kWh. A location-based calculation method reflects the average emissions intensity of grids (using mostly grid- average emission factor data). A market-based calculation method reflects emissions from electricity that companies have purposefully chosen (or their lack of choice). It derives emission factors from contracts between two parties for the sale and purchase of energy bundled with attributes about the energy generation, or for unbundled attribute claims. (Source: Greenhouse gas protocol). ", "Net profit after all revenues, income items and expenses, including tax, have been accounted for.", "Emissions from the use of products (GHG Protocol category 11) originating from Equinor\u2019s equity oil and gas production. Regional product spreads are assumed using IEA statistics. ", "Non-methane volatile organic compounds (nmVOC) emissions", "New Energy Solutions\u2019 (NES) gross capital expenditure, before including the effect of project financing.", "NOx released from power generation and heat production, flaring (including well testing/well work-over) and process.", "Waste that is not defined as hazardous waste. 
This excludes drill cuttings and produced and flow-back water from our USA onshore operations which are exempted from regulation and are registered separately as \u2018exempted waste\u2019.", "nmVOC released to the atmosphere from power generation and heat production, flaring (including well testing/well work-over), process, cold venting and fugitives.", "Temporary or permanent sites, activities and assets used for exploration, extraction, refining, transporting, distributing, and marketing petroleum products.", "Unintentional spills of chemicals, produced water, ballast water and polluted water reaching the natural environment.", "Payments made directly by Equinor to governments, such as income tax, host government entitlements (value), bonuses, royalties and fees, related to exploration and production activities. Includes environmental fees and taxes. Payments made on behalf of other license partners, e.g. area fees, are included.", "Water that is brought to the surface during operations which extract hydrocarbons from oil and gas reservoirs.", "A protected area is a clearly defined geographical space, recognised, dedicated and managed, through legal or other effective means, to achieve the long term conservation of nature with associated ecosystem services and cultural values. (IUCN Definition 2008).", "Part of the cost is charged to partners in activities we operate.", "The psychosocial work environment concerns aspects of the design and management of work and its social and organisational context that could have an impact on the employee\u2019s health and well-being.", "Waste from Equinor operated activities that has been delivered for reuse, recycling or incineration with energy recovery.", "Oil in regulated or controlled discharges to the sea from Equinor operated activities. This includes produced water, process water, displacement water, ballast water, jetting water, drainage water and water discharged from treatment plants. 
", "Total revenues including income from sales of liquids on behalf of the Norwegian state\u2019s direct financial interest.", "The United Nations\u2019 Sustainable Development Goals.", "The International Energy Agency\u2019s (IEA) Sustainable Development Scenario. ", "A monitoring and mapping programme for Norwegian seabirds (SEAbird POPulations). ", "The number of serious incidents (including near misses) per million hours worked. An incident is an event or chain of events that has caused or could have caused injury, illness and/or damage to/loss of property, the environment or a third party. All undesirable incidents are categorised according to degree of seriousness, based on established categorisation matrices.", "Share of production in areas of high water stress", "The share in % of Equinor\u2019s operated production in areas of high or extremely high baseline water stress, versus Equinor\u2019s total operated production. World Resources Institute\u2019s Aqueduct tool is used to determine baseline water stress, which is the ratio of total annual water withdrawal from a catchment to average annual available water to the same catchment. The Aqueduct tool classifies stress into five levels, Low, Low-medium, Medium-high, High and Extremely high. (Aqueduct indicator: Baseline Water Stress).", "The total number of sickness absence hours as a percentage of planned working hours (Equinor ASA employees).", "Includes voluntary and contractual payments. Part of the cost is charged to partners in activities we operate. Contractual social investments include the contributions that we are required to pay under the terms of the production sharing agreements (PSA) or contracts or host government agreements or national laws.", "Science, technology, engineering and mathematics. ", "SOx released from power generation and heat production, flaring and process.", "Task Force on Climate-related Financial Disclosures. 
", "Total recordable injury frequency (TRIF)", "Number of fatal accidents, lost-time injuries, injuries involving substitute work and medical treatment injuries per million hours worked.", "United Nations Guiding Principles on Business and Human Rights", "Upstream carbon dioxide (CO\u2082 ) emission intensity", "Total scope one emissions of CO\u2082 (kg CO\u2082) from exploration and production, divided by total production (boe).", "Voluntary Principles on Security and Human Rights.", "Materials are defined as waste when; they are classified as such according to the regulations under which the activity operates or where the material is contained and intended to be transported for further handling and/or re-use or disposal by a 3rd party. Residual materials from industrial activity, which are discharged, recycled, injected or reused at the place of generation as part of the consented operations, are not included.", "Number of WRI incidents that result in death, serious WRI, WRI that results in treatment from authorized health care personnel and other WRI per million of hours worked. For Equinor employees and contractors.", "Equinor Sustainability report 2019AppendicesEquinor Sustainability report 2019 Appendices"], "30": ["Task Force on Climate-related Financial Disclosures (TCFD) reference index", "Governance \u2013 Disclose the organisation\u2019s governance around climate-related risks and opportunities", "a) Describe the board\u2019s oversight of climate-related ", "b) Describe management\u2019s role in assessing and managing ", "climate-related risks and opportunities. 
", "\u2022 AR 3.9 \u2013 The work of the Board of Directors \u2022 SR \u2013 Embedding sustainability in how we work \u2022 SR \u2013 Climate-related business risks and portfolio resilience ", "\u2022 AR 3.10 \u2013 Risk management and internal control \u2022 SR \u2013 Embedding sustainability in how we work \u2022 SR \u2013 Climate-related business risks and portfolio resilience ", "Strategy \u2013 Disclose the actual and potential impacts of climate-related risks and opportunities on the organisation\u2019s businesses, strategy, and financial planning where such information is material ", "a) Describe the climate-related risks and opportunities the ", "organisation has identified over the short, medium, and long term. ", "\u2022 AR 2.11 \u2013 Risk review \u2022 SR \u2013 Climate-related business risks and portfolio resilience \u2022 Equinor\u2019s CDP 2019 response ", "b) Describe the impact of climate-related risks and opportunities on the organisation\u2019s businesses, strategy, and financial planning. ", "\u2022 AR 2.12 \u2013 Safety, security and sustainability \u2013 Portfolio sensitivity test \u2022 SR \u2013 Climate-related business risks and portfolio resilience \u2013 ", "c) Describe the resilience of the organisation\u2019s strategy, taking into ", "consideration different climate-related scenarios, including a 2C or lower scenario. 
", "\u2022 AR 2.12 \u2013 Safety, security and sustainability \u2013 Portfolio sensitivity test \u2022 SR \u2013 Climate-related business risks and portfolio resilience \u2022 Equinor\u2019s Energy Perspectives 2019", "Risk management \u2013 Disclose how the organisation identifies, assesses, and manages climate-related risks ", "a) Describe the organisation\u2019s processes for identifying and assessing ", "\u2022 AR 2.11 \u2013 Risk review \u2013 Risk management \u2022 SR \u2013 Embedding sustainability in how we work \u2022 SR \u2013 Climate-related business risks and portfolio resilience \u2022 Equinor\u2019s 2019 CDP response ", "b) Describe the organisation\u2019s processes for managing ", "c) Describe how processes for identifying, assessing, and managing climate-related risks are integrated into the organisation\u2019s overall risk management. ", "Metrics and targets \u2013 Disclose the metrics and targets used to assess and manage relevant climate-related risks and opportunities where such information is material ", "a) Disclose the metrics used by the organisation to assess ", "climate-related risks and opportunities in line with its strategy and risk management process. ", "\u2022 AR 2.12 \u2013 Safety, security and sustainability \u2022 SR\u2013 Climate performance \u2022 SR \u2013 Climate-related business risks and portfolio resilience \u2013 ", "\u2022 Sustainability performance data at equinor.com", "b) Disclose Scope 1, Scope 2, and, if appropriate, Scope 3 greenhouse gas ", "\u2022 AR 2.12 \u2013 Safety, security and sustainability \u2022 SR \u2013 Climate performance ", "c) Describe the targets used by the organisation to manage climate-related ", "risks and opportunities and performance against targets. 
", "Statsautoriserte revisorer Ernst & Young AS Dronning Eufemias gate 6, NO-0191 Oslo Postboks 1156 Sentrum, NO-0107 Oslo ", "Tlf: +47 24 00 24 00 Fax: www.ey.no Medlemmer av Den norske revisorforening ", "Independent assurance report \u2013 Reporting on Sustainability for 2019 ", "We have performed an independent verification of Equinor ASA\u2019s reporting on Sustainability for 2019 (the Report) as Equinor has defined in its 2019 GRI standards index and on page 5 of the Sustainability Report. Our review includes data from Equinor ASA\u2019s 2019 Sustainability Report and figures presented in the Sustainability Datahub as shown in the GRI Index. We have assessed if the information being presented in the Report is based on relevant criteria from the GRI (Global Reporting Initiative) sustainability reporting standards, GRI Standards option core. Controlled information is shown in the company's GRI index, see https://www.equinor.com/en/how-and- why/sustainability/sustainability-reports.html. ", "The CEO and Executive Management are responsible for the selection of the information and collection of the data for presentation and for the preparation of the Report in accordance with the applicable criteria. The criteria are defined on page 5 in the Sustainability Report and are based on the Sustainability Reporting Guidelines published by GRI that are applicable to the Report, as well as the accounting and calculation principles that Equinor ASA has developed. This responsibility includes the internal control relevant to the preparation of a Report that is free from material misstatements, whether due to fraud or error. ", "Our Independence and Quality Control ", "We are independent of the company as required by law and regulations and have complied with our other ethical obligations in accordance with these requirements. 
We apply the International Standard on Quality Control (ISQC 1) and maintain a comprehensive system of quality control including documented policies and procedures regarding compliance with ethical requirements, professional standards and applicable legal and regulatory requirements. ", "Auditor\u2019s tasks and duties Our task is to issue an independent report to the CEO on the Reporting on Sustainability based on our work. Our work is conducted in accordance with ISAE 3000 Assurance Engagements Other than Audits or Reviews of Historical Financial Information. This engagement consists of two parts a limited assurance engagement and a reasonable assurance of selected disclosures. A limited assurance engagement is different from and substantially less in scope than reasonable assurance engagement conducted in accordance with IAASB\u2019s Standards on Auditing and other generally accepted auditing standards. ", "Limited assurance engagement The engagement includes a limited assurance engagement on the complete Sustainability Report, excluding forward looking information related to the climate-related business risks and portfolio resilience chapter, as shown in the GRI index. A limited assurance engagement consists of making inquiries, primarily of persons responsible for the preparation of the Report and applying analytical and other limited assurance procedures. 
", "To obtain limited assurance we have performed the following procedures: ", "\uf0b7 Review of Equinor ASA\u2019s process for the preparation and presentation of the Reporting on Sustainability to ", "provide us with an understanding of how Sustainability is ensured in practice within the business Interviewing those in charge of Sustainability reporting to develop an understanding of the process for the preparation of the Reporting on Sustainability ", "\uf0b7 Verifying on a sample basis the information in the Reporting on Sustainability against source data and other ", "information prepared by Equinor ASA ", "A member firm of Ernst & Young Global Limited ", "Equinor Sustainability report 2019AppendicesEquinor Sustainability report 2019 Appendices"], "31": ["\uf0b7 Assessing the overall presentation of Reporting on Sustainability against the criteria in GRI Standards", "including a review of the consistency of information against the GRI index.", "The engagement also included a reasonable assurance engagement on the data that is specified below, as shown in the GRI index. A reasonable assurance engagement includes examining, on a test basis, evidence supporting the quantitative and qualitative information in the Report. 
", "We have additionally performed controls in order to establish a reasonable level of assurance for a selection of disclosures as defined by Equinor for own controlled operations as listed below: ", "\uf0b7 Disclosures on safety: Total recordable injury frequency (TRIF), Serious incident frequency (SIF), Fatalities,", "\uf0b7 Disclosures on climate and environment: emissions of Carbon dioxide, Methane, NOx and SOx; and energy", "Oil spills, Serious oil and gas leakages;", "In addition to the previously mentioned procedures, for the reasonable assurance engagement we also performed the additional procedures: ", "\uf0b7 One physical site visits and in-depth interviews with three Equinor locations in order to gather and review", "underlying data and confirm the implementation of the processes and controls related to the preparation of the selected safety and environmental KPIs", "\uf0b7 Recalculating the safety and climate KPIs and evaluating the reasonableness of estimates made by Equinor \uf0b7 Reviewing the trend and explanations submitted by sites and prepared at corporate level \uf0b7", "Interviewing relevant staff with responsibility for preparing the sustainability data at corporate, business area and local area, including those with responsibility for carrying out internal control procedures on the data and consolidating the data for the sustainability report", "\uf0b7 Confirming agreement of the CO2 reporting for Norway with the preliminary EUETS reporting", "In our opinion, the evidence obtained is sufficient and appropriate to provide a basis for our conclusion. ", "Conclusion For the limited assurance engagement, nothing has come to our attention that causes us to believe that the Sustainability Report is not prepared, in all material respects, in accordance with GRI and the criteria defined by the CEO and Executive Management. 
", "For the reasonable assurance engagement it is our opinion that the disclosures on safety: Total recordable injury frequency (TRIF), Serious incident frequency (SIF), Fatalities, Oil spills, Serious oil and gas leakages; and disclosures on climate and environment: emissions of Carbon dioxide, Methane, NOx and SOx; and energy consumption have, in all material respects, been prepared in accordance with the criteria defined by the CEO and Executive Management. ", "Erik Mamelund State Authorised Public Accountant ", "Independent assurance report \u2013 Equinor ASA", "A member firm of Ernst & Young Global Limited ", "Photography Ole Jrgen Bratland/Arne Reidar Mortensen/Equinor ASA. ", "Einar Aslaksen. David Gustav Tvetene. ivind Haug.", "Illustrations and design Equinor ASA.", "This report contains certain forward-looking statements that involve risks and uncertainties. In some cases, we use words such as aim, ambition, continue, expect, may, strategy, will, in line with, and similar expressions to identify forward-looking statements. 
Forward-looking statements include all statements other than statements of historical fact, including, among others, statements regarding Equinor\u2019s ambitions, plans, intentions, aims and expectations with respect to Equinor\u2019s new climate roadmap, including with respect to its net carbon intensity, carbon efficiency, methane emissions and flaring reductions, renewable energy capacity, carbon-neutral global operations, internal carbon price on investment decisions, future levels of, and expected value creation from, oil and gas production, scale and composition of the oil and gas portfolio, development of CCUS and hydrogen businesses, use of offset mechanisms and natural sinks and support of TCFD recommendations.", "These forward-looking statements reflect current views about future events and are, by their nature, subject to significant risks and uncertainties because they relate to events and depend on circumstances that will occur in the future and are beyond Equinor\u2019s control and are difficult to predict, including societal shifts in consumer demand and technological advancements. Although we believe that the expectations reflected in such forward-looking statements are reasonable, we cannot assure you that future results will meet these expectations. You should therefore not place undue reliance on these forward-looking statements. Actual results could differ materially from those anticipated in these forward-looking statements for many reasons. Equinor does not assume any responsibility for the accuracy and completeness of any forward-looking statements. Any forward-looking statement speaks only as of the date on which such statement is made. 
Unless required by law, we will not necessarily update any of these statements.", "Equinor is including the emissions from a customer\u2019s product use in its calculation of its net carbon intensity solely as a means to (i) more accurately evaluate the emission lifecycle of what we produce and (ii) to respond to the potential business opportunities arising from shifting consumer demands. Including these emissions in the calculation should in no way be construed as an acceptance by Equinor of responsibility for the emissions caused by such use.", "Additional information, including information on factors that may affect Equinor\u2019s business, is contained in Equinor\u2019s latest Annual Report and Form 20-F, filed with the U.S. Securities and Exchange Commission (and section Risk review \u2013 Risk factors thereof), which is available at Equinor\u2019s website (www.equinor.com).", "Equinor Sustainability report 2019AppendicesEquinor Sustainability report 2019 Appendices"], "32": ["Equinor ASA Box 8500 NO-4035 Stavanger Norway Telephone: +47 51 99 00 00 www.equinor.com"]} diff --git a/data/pdfs/ESG/sustainability-report-2019.pdf b/data/pdfs/ESG/sustainability-report-2019.pdf new file mode 100755 index 0000000..b295d59 Binary files /dev/null and b/data/pdfs/ESG/sustainability-report-2019.pdf differ diff --git a/notebooks/demo2/pdf_text_extraction.ipynb b/notebooks/demo2/pdf_text_extraction.ipynb new file mode 100644 index 0000000..c837c93 --- /dev/null +++ b/notebooks/demo2/pdf_text_extraction.ipynb @@ -0,0 +1,100 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Text Extraction\n", + "As a first step of the pipeline, we aim to extract text from PDFs in this notebook. The input PDFs for this notebook are in the `ROOT/data/pdfs` directory and the output JSON will be stored in the `ROOT/data/extraction` directory. The output from this notebook combined with the annotations will be used in the next step of curation." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Author: ALLIANZ NLP esg data pipeline\n", + "from src.components.preprocessing import Extractor\n", + "import src.components.config as config" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "PDF_FOLDER = config.BASE_PDF_FOLDER\n", + "EXT_FOLDER = config.BASE_EXTRACTION_FOLDER" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Call text extractor" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "PDFTextExtractor_kwargs = {\n", + " \"min_paragraph_length\": 30,\n", + " \"annotation_folder\": None,\n", + " \"skip_extracted_files\": False,\n", + "}" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "['/home/shanand/aicoe-osc-demo/data/pdfs/ESG/sustainability-report-2019.pdf']\n" + ] + } + ], + "source": [ + "ext = Extractor([(\"PDFTextExtractor\", PDFTextExtractor_kwargs)])\n", + "ext.run_folder(PDF_FOLDER, EXT_FOLDER)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Conclusion\n", + "We called the Extractor class to extract text from the PDF and store the output in the `ROOT/data/extraction` folder." 
+ ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.3" + } + }, + "nbformat": 4, + "nbformat_minor": 4 +} diff --git a/src/__init__.py b/src/__init__.py index 408f7ee..e69de29 100644 --- a/src/__init__.py +++ b/src/__init__.py @@ -1 +0,0 @@ -"""Analytics compiled into python code.""" diff --git a/src/components/config.py b/src/components/config.py new file mode 100644 index 0000000..75541c0 --- /dev/null +++ b/src/components/config.py @@ -0,0 +1,92 @@ +import os +import src +import pathlib +import torch + +# General config +STAGE = "extract" # "extract" | "curate " +SEED = 42 + +ROOT = pathlib.Path(src.__file__).resolve().parent.parent +CONFIG_FOLDER = ROOT / "config" +CHECKPOINT_FOLDER = ROOT / "checkpoint" +# the data for demo notebooks is located at sample_data directory +DATA_FOLDER = ROOT / "data" +BASE_PDF_FOLDER = DATA_FOLDER / "pdfs" +BASE_ANNOTATION_FOLDER = DATA_FOLDER / "annotations" +BASE_EXTRACTION_FOLDER = DATA_FOLDER / "extraction" +BASE_CURATION_FOLDER = DATA_FOLDER / "curation" + + +if not os.path.exists(BASE_EXTRACTION_FOLDER): + os.mkdir(BASE_EXTRACTION_FOLDER) +if not os.path.exists(BASE_CURATION_FOLDER): + os.mkdir(BASE_CURATION_FOLDER) + +ckpt = "icdar_19b2_v2.pth" if "cpu" in torch.__version__ else "icdar_19b2.pth" +config_file = ( + "cascade_mask_rcnn_hrnetv2p_w32_20e_coco.py" + if "cpu" in torch.__version__ + else "cascade_mask_rcnn_hrnetv2p_w32_20e.py" +) +PDFTableExtractor_kwargs = { + "batch_size": -1, + "cscdtabnet_config": CONFIG_FOLDER / config_file, + "cscdtabnet_ckpt": CHECKPOINT_FOLDER / ckpt, + "bbox_thres": 0.85, + "dpi": 200, +} + +# PDFTextExtractor +PDFTextExtractor_kwargs = { + "min_paragraph_length": 30, + # 
Set to ANNOTATION_FOLDER if you want to extract just pdfs mentioned in the annotations + # Set to None to extract all pdfs in pdf folder (for production stage) + "annotation_folder": None, + "skip_extracted_files": False, +} + +TableCurator_kwargs = { + "neg_pos_ratio": 1, + "create_neg_samples": True, + "columns_to_read": [ + "company", + "source_file", + "source_page", + "kpi_id", + "year", + "answer", + "data_type", + ], + "company_to_exclude": ["CEZ"], + "seed": SEED, +} + +TextCurator_kwargs = { + "retrieve_paragraph": False, + "neg_pos_ratio": 1, + "columns_to_read": [ + "company", + "source_file", + "source_page", + "kpi_id", + "year", + "answer", + "data_type", + "relevant_paragraphs", + ], + "company_to_exclude": [], + "create_neg_samples": True, + "seed": SEED, +} + +# Components +EXTRACTORS = [ + # ("PDFTableExtractor", PDFTableExtractor_kwargs), + ("PDFTextExtractor", PDFTextExtractor_kwargs) +] + +CURATORS = [ + ("TextCurator", TextCurator_kwargs) + # ,("TableCurator", TableCurator_kwargs) +] diff --git a/src/components/preprocessing/__init__.py b/src/components/preprocessing/__init__.py new file mode 100755 index 0000000..a3ebb46 --- /dev/null +++ b/src/components/preprocessing/__init__.py @@ -0,0 +1,9 @@ +from .base_component import BaseComponent # noqa F401 +from .pdf_table_extractor import PDFTableExtractor # noqa F401 +from .pdf_text_extractor import PDFTextExtractor # noqa F401 +from .extractor import Extractor # noqa F401 +from .nq_extractor import NQExtractor # noqa F401 +from .nq_curator import NQCurator # noqa F401 +from .curator import Curator # noqa F401 +from .text_curator import TextCurator # noqa F401 +from .table_curator import TableCurator # noqa F401 diff --git a/src/components/preprocessing/base_component.py b/src/components/preprocessing/base_component.py new file mode 100755 index 0000000..e503e5f --- /dev/null +++ b/src/components/preprocessing/base_component.py @@ -0,0 +1,10 @@ +from abc import ABC, abstractmethod + + +class 
BaseComponent(ABC): + def __init__(self, name="Base"): + self.name = name + + @abstractmethod + def run(self, *args, **kwargs): + pass diff --git a/src/components/preprocessing/base_curator.py b/src/components/preprocessing/base_curator.py new file mode 100755 index 0000000..c465670 --- /dev/null +++ b/src/components/preprocessing/base_curator.py @@ -0,0 +1,42 @@ +import re +from abc import abstractmethod + +from .base_component import BaseComponent + + +# Remember to also implement BaseComponent's abstract methods for child classes +# of this class +class BaseCurator(BaseComponent): + def __init__(self, name="BaseCurator"): + self.name = name + + @abstractmethod + def process_single_annotation_file(self, annotation_filepath, *args, **kwargs): + pass + + @abstractmethod + def create_pos_examples(self, row, *args, **kwargs): + pass + + @abstractmethod + def create_negative_examples(self, row, *args, **kwargs): + pass + + @staticmethod + def clean_text(text): + """ + Clean text + + Args: + text (A str) + """ + # Substitute unusual quotes at the start of the string with usual quotes + text = re.sub("(?<=\[)“", '"', text) # noqa W605 + # Substitute unusual quotes at the end of the string with usual quotes + text = re.sub("”(?=\])", '"', text) # noqa W605 + # Remove the remaining unusual quotes + text = re.sub("“|”", "", text) + text = re.sub("\n|\t", " ", text) + text = re.sub(r"[\x00-\x08\x0b\x0c\x0e-\x1f\x7f-\xff]", "", text) + text = re.sub(r"\s{2,}", " ", text) + return text diff --git a/src/components/preprocessing/curator.py b/src/components/preprocessing/curator.py new file mode 100755 index 0000000..240f736 --- /dev/null +++ b/src/components/preprocessing/curator.py @@ -0,0 +1,50 @@ +import glob +import logging + +from .text_curator import TextCurator +from .table_curator import TableCurator + +logger = logging.getLogger(__name__) +NAME_CLASS_MAPPING = {"TextCurator": TextCurator, "TableCurator": TableCurator} + + +class Curator: + """A data 
curator component responsible for creating table and text training data based on annotated data + Args: + annotation_folder (str): path to the folder containing annotation excel files + """ + + def __init__(self, curators): + self.curators = self.__create_curators(curators) + + def __create_curators(self, curators): + """ + Returns a list of curator objects + + Args: + curators (A list of str) + """ + list_cura = [] + for cura in curators: + try: + cura_obj = NAME_CLASS_MAPPING[cura[0]](**cura[1]) + except KeyError: + raise ValueError("{} is an invalid extractor".format(cura[0])) + + list_cura.append(cura_obj) + + return list_cura + + def run(self, input_extraction_folder, annotation_folder, output_folder): + """Runs curation for each curator. + + Args: + input_extraction_folder (A str or PosixPath) + annotation_folder (A str or PosixPath) + output_folder (A str or PosixPath) + """ + annotation_excels = glob.glob("{}/[!~$]*[.xlsx]".format(annotation_folder)) + logger.info("Received {} excel files".format(len(annotation_excels))) + + for curator_obj in self.curators: + curator_obj.run(input_extraction_folder, annotation_excels, output_folder) diff --git a/src/components/preprocessing/extractor.py b/src/components/preprocessing/extractor.py new file mode 100755 index 0000000..eeb7c2c --- /dev/null +++ b/src/components/preprocessing/extractor.py @@ -0,0 +1,63 @@ +from .pdf_table_extractor import PDFTableExtractor +from .pdf_text_extractor import PDFTextExtractor +import logging + +_logger = logging.getLogger(__name__) +NAME_CLASS_MAPPING = { + "PDFTextExtractor": PDFTextExtractor, + "PDFTableExtractor": PDFTableExtractor, +} + + +class Extractor: + def __init__(self, extractors): + """ + A pipeline extractor which combines different types of extractors + + Args: + extractors (A list of tuples): (Name of extractor, kwargs_dict) + """ + self.extractors = self.__create_extractors(extractors) + + def __create_extractors(self, extractors): + """Returns a list of extractors 
objects + + Args: + extractors (A list of str) + """ + list_ext = [] + for ext in extractors: + try: + ext_obj = NAME_CLASS_MAPPING[ext[0]](**ext[1]) + except KeyError: + raise ValueError("{} is an invalid extractor".format(ext[0])) + + list_ext.append(ext_obj) + + return list_ext + + def run(self, input_filepath, output_folder): + """ + Extract a single file + + Args: + input_filepath (str): Input file path + output_folder (str): Output folder path + + """ + _logger.info("Running all extractors...") + + for ext in self.extractors: + _ = ext.run(input_filepath, output_folder) + + def run_folder(self, input_folder, output_folder): + """ + Extract for all files mentioned in folder. + (The logic is based on each child.) + + Args: + input_folder (A str): Input folder path + output_folder (A str): Output folder path + """ + for ext in self.extractors: + ext.run_folder(input_folder, output_folder) diff --git a/src/components/preprocessing/nq_curator.py b/src/components/preprocessing/nq_curator.py new file mode 100755 index 0000000..63e547c --- /dev/null +++ b/src/components/preprocessing/nq_curator.py @@ -0,0 +1,240 @@ +import logging +import os +from ast import literal_eval +from glob import glob +from multiprocessing import Pool, cpu_count + +import pandas as pd +import tqdm + +from src.components.utils.nq_utils import ( + get_text_section, + remove_html_tags, + contains_table, + is_not_short, +) +from .base_component import BaseComponent + +logger = logging.getLogger(__name__) + + +class NQCurator(BaseComponent): + """Component that creates balanced datasets for text and table data from the extracted NQ data + Args: + input_dir(str): The directory where the extracted CSVs are located. + output_dir(str): The directory where the curated CSVs will be saved. 
+ extract_text(bool): Set to True to curate the table data + extract_tables(bool): Set to True to curate the text data + negative_from_other_docs(bool): If set to True, the negative examples are sampled from paragraphs from + the same document from which the positive examples are taken from. If False, they will be sampled from + other documents. + + """ + + def __init__( + self, + input_dir, + output_dir, + extract_text, + extract_tables, + negative_from_other_docs=True, + name="NQCurator", + ): + super().__init__(name) + self._input_dir = input_dir + self._output_dir = output_dir + self._extract_text = extract_text + self._extract_tables = extract_tables + self._negative_from_other_docs = negative_from_other_docs + + @staticmethod + def _extract_paragraphs(df): + """Extracts the content of the relevant and candidate answer paragraphs from the token start and end indices + Args: + df(Pandas dataframe): The input dataframe. + Returns: + df(Pandas dataframe): Same dataframe as the input, with two additional columns: `document_text` and + `other_long_answer_candidates` + """ + logger.info("Extracting relevant paragraphs...") + df["relevant_excerpt"] = [ + get_text_section(doc_tokens) + for doc_tokens in tqdm.tqdm( + zip( + df["document_text"].tolist(), + df["long_answer_start"].tolist(), + df["long_answer_end"].tolist(), + ), + total=len(df), + ) + ] + + logger.info("Extracting other long answer candidates...") + process_count = cpu_count() - 1 + with Pool(process_count) as p: + all_other_candidates = [ + list( + p.map( + get_text_section, + [(doc, p["start_token"], p["end_token"]) for p in paras], + ) + ) + for (doc, paras) in tqdm.tqdm( + zip( + df["document_text"].tolist(), + df["other_long_answer_candidates"].tolist(), + ), + total=len(df), + ) + ] + + df["other_candidates"] = all_other_candidates + + return df + + @staticmethod + def create_relevance_dataset(input_df): + """ + Process NQ dataset to get both a text dataset and a table dataset to train a + 
relevance classifier + Args: + input_df (dataframe): original NQ dataset loaded using jsonl_to_df + Returns: + df_text (dataframe): A dataframe containing the questions, positive and negative paragraph examples, + and the labels + df_table (dataframe): A dataframe containing the questions, positive and negative table examples, + and labels + """ + + # Create dataframe with only question, text and label + logger.info("Creating relevance dataframe") + all_data = [ + {"question": q, "text": t, "label": 1} + for (q, t) in zip(input_df["question_text"], input_df["relevant_excerpt"]) + ] + all_data += [ + {"question": q, "text": t, "label": 0} + for (q, texts) in zip( + input_df["question_text"], input_df["other_candidates"] + ) + for t in texts + ] + + del input_df + df_relevance = pd.DataFrame(all_data) + + df_relevance["with_table"] = df_relevance["text"].map(contains_table) + + # Changed df_relevance[(df_relevance["with_table"] == True)] to this + df_table = df_relevance[df_relevance["with_table"]].copy() + df_text = df_relevance.drop(df_table.index).reset_index(drop=True).copy() + df_table = df_table.reset_index(drop=True) + + df_table.drop(columns="with_table", inplace=True) + df_text.drop(columns="with_table", inplace=True) + + # Remove HTML tags + logger.info("Removing HTML tags...") + df_text["text"] = df_text["text"].map(remove_html_tags) + + # Remove too short paragraphs + logger.info("Removing short paragraphs...") + df_text = df_text[df_text["text"].map(is_not_short)] + + df_text = df_text.reset_index(drop=True) + + # Keep only questions that have both positive and negative samples after + # filtering + groups = df_text.groupby("question") + df_text = groups.filter( + lambda x: (1 in list(x["label"])) & (0 in list(x["label"])) + ) + + return df_text, df_table + + def _build_balanced_dataset(self, df): + """ + Select negative samples to build a balanced NQ relevance dataset and save it + to csv + Args: + df (dataframe): Processed NQ data with text only or 
table only data + (output of to_relevance_dataset() method) + Returns: + balanced_dataset (dataframe) + """ + + # Get positive samples + positive_samples = df.loc[df.label == 1].reset_index(drop=True) + # Get negative candidates + negative_candidates = df.loc[df.label == 0].reset_index(drop=True) + # Shuffle all the candidates + negative_candidates = negative_candidates.sample( + frac=1, random_state=42 + ).reset_index(drop=True) + # Select one negative candidate per question + negative_samples = negative_candidates.groupby("question").first().reset_index() + + if self._negative_from_other_docs: + # Shuffle the questions + new_questions = ( + negative_samples["question"] + .sample(frac=1, random_state=42) + .reset_index(drop=True) + ) + # Assign new questions to the selected negative candidates + negative_samples["question"] = new_questions + + balanced_dataset = ( + pd.concat([positive_samples, negative_samples]) + .sample(frac=1, random_state=42) + .reset_index(drop=True) + ) + return balanced_dataset + + def _run(self, df_path): + """The run method for a single chunk of data. 
Will curate a text and a table dataset from the `df_path` + Args: + df_path(str): Path to the CSV where the chunk of parsed data is saved at + Returns: + df_text_balanced(Pandas df): A dataframe with equal number of pos and neg text examples + df_table_balanced(Pandas df): A dataframe with equal number of pos and neg table examples + """ + df = pd.read_csv( + df_path, converters={"other_long_answer_candidates": literal_eval} + ) + df = self._extract_paragraphs(df) + df_text, df_table = self.create_relevance_dataset(df) + + df_text_balanced = ( + self._build_balanced_dataset(df_text) if self._extract_text else None + ) + df_table_balanced = ( + self._build_balanced_dataset(df_table) if self._extract_tables else None + ) + + return df_text_balanced, df_table_balanced + + def run(self): + """Loads all the extracted CSVs, and processes them one by one, curating a text and a table dataset from each + The datasets are then aggregated and saved as CSV. + """ + logger.info("Running the Curation stage") + logger.info("=" * 30) + processed_files_paths = sorted(glob(os.path.join(self._input_dir, "*.csv"))) + list_df_text_balanced = [] + list_df_table_balanced = [] + for path in processed_files_paths: + df_text_balanced, df_table_balanced = self._run(path) + list_df_text_balanced.append(df_text_balanced) + list_df_table_balanced.append(df_table_balanced) + + if self._extract_text: + df_text_agg = pd.concat(list_df_text_balanced) + df_text_agg.to_csv( + os.path.join(self._output_dir, "NQ_text_relevance_balanced.csv") + ) + if self._extract_tables: + df_table_agg = pd.concat(list_df_table_balanced) + df_table_agg.to_csv( + os.path.join(self._output_dir, "NQ_table_relevance_balanced.csv") + ) diff --git a/src/components/preprocessing/nq_extractor.py b/src/components/preprocessing/nq_extractor.py new file mode 100755 index 0000000..f0e3a15 --- /dev/null +++ b/src/components/preprocessing/nq_extractor.py @@ -0,0 +1,130 @@ +import json +import logging +import os + +import pandas as 
pd +import tqdm + +from .base_component import BaseComponent + +logger = logging.getLogger(__name__) + + +class NQExtractor(BaseComponent): + """ + The component to load the .jsonl files into a dataframe in chunks, extract the long answer candidates, and save + each chunk as a CSV. + Args: + raw_nq_json_file(str): Path to the raw NQ JSONL file + out_dir(str): Path to the directory where the parsed CSV files will be saved in + nrwos(int): Number of examples to parse. Set to -1 to parse all. + drop_no_long_answer(bool): Drop the examples that don't have a long answer + chunk_size(int): Number of parsed examples to be grouped together and saved in a CSV file + """ + + def __init__( + self, + raw_nq_json_file, + out_dir, + n_rows=-1, + drop_no_long_answer=True, + chunk_size=10000, + name="NQExtractor", + ): + super().__init__(name) + self._raw_nq_json_file = raw_nq_json_file + self._out_dir = out_dir + self._n_rows = n_rows + self._drop_no_long_answer = drop_no_long_answer + self._chunk_size = chunk_size + + def _write_chunk_to_disk(self, chunk_data, chunk_idx): + """Helper function to save a chunk of data to a CSV file""" + df = pd.DataFrame(chunk_data).fillna(-1) + output_path = os.path.join(self._out_dir, "Parsed_NQ_{}.csv".format(chunk_idx)) + df.to_csv(output_path) + + def run(self): + """ + Simple utility function to load the .jsonl files into a dataframe, and ex- + tract long answer candidates + Returns: + A Dataframe containing the following columns: + * document_text (str): The document split by whitespace + * question_text (str): the question posed + * yes_no_answer (str): Could be "YES", "NO", or "NONE" + * short_answer_start (int): Start index of token, -1 if does not exist + * short_answer_end (int): End index of token, -1 if does not exist + * long_answer_start (int): Start index of token, -1 if does not exist + * long_answer_end (int): End index of token, -1 if does not exist + * example_id (str): ID representing the string. 
+ * relevant_excerpt (str): text containing the short answer + * other_canditates (list): list strings containing excerpts tagged + as long answer candidates but not containing the short answer + """ + logger.info("Running the Extraction stage...") + logger.info("=" * 30) + json_lines = [] + logger.info("Loading original .json file...") + extraction_counter = 0 + chunk_idx = ( + 0 # Used to group N examples together and write to a CSV. N=chunk_size + ) + with open(self._raw_nq_json_file) as f: + for line in tqdm.tqdm(f): + if extraction_counter == self._n_rows: + break + line = json.loads(line) + + out_di = { + "document_text": line["document_text"], + "question_text": line["question_text"], + } + + if "example_id" in line: + out_di["example_id"] = line["example_id"] + + annot = line["annotations"][0] + + # Dropping examples that don't have a long answer + if ( + self._drop_no_long_answer + and annot["long_answer"]["candidate_index"] == -1 + ): + continue + + out_di["yes_no_answer"] = annot["yes_no_answer"] + out_di["long_answer_start"] = annot["long_answer"]["start_token"] + out_di["long_answer_end"] = annot["long_answer"]["end_token"] + + if len(annot["short_answers"]) > 0: + out_di["short_answer_start"] = annot["short_answers"][0][ + "start_token" + ] + out_di["short_answer_end"] = annot["short_answers"][0]["end_token"] + else: + out_di["short_answer_start"] = -1 + out_di["short_answer_end"] = -1 + + candidate_index = annot["long_answer"]["candidate_index"] + # gather other long answer candidates that doesn't contain the short answer + other_long_answer_candidates = [ + line["long_answer_candidates"][i] + for i in range(len(line["long_answer_candidates"])) + if i != candidate_index + and line["long_answer_candidates"][i]["top_level"] is True + ] + + out_di["other_long_answer_candidates"] = other_long_answer_candidates + + json_lines.append(out_di) + extraction_counter += 1 + if extraction_counter % self._chunk_size == 0: + self._write_chunk_to_disk( + 
chunk_data=json_lines, chunk_idx=chunk_idx + ) + json_lines = [] + chunk_idx += 1 + + # Last chunk: + self._write_chunk_to_disk(chunk_data=json_lines, chunk_idx=chunk_idx) diff --git a/src/components/preprocessing/pdf_table_extractor.py b/src/components/preprocessing/pdf_table_extractor.py new file mode 100755 index 0000000..958e9d1 --- /dev/null +++ b/src/components/preprocessing/pdf_table_extractor.py @@ -0,0 +1,285 @@ +from .base_component import BaseComponent +import os +from pdf2image import convert_from_path, pdfinfo_from_path +from mmdet.apis import init_detector, inference_detector +import numpy as np +from tabula import read_pdf +from collections import defaultdict +from multiprocessing import Pool, cpu_count +from functools import partial +import subprocess + +import gdown +from tqdm import tqdm +from src.components.utils.cscdtabnet_checkpoint_url import checkpoint_url + +import logging + +_logger = logging.getLogger(__name__) + + +class PDFTableExtractor(BaseComponent): + def __init__( + self, + batch_size, + cscdtabnet_config, + cscdtabnet_ckpt, + bbox_thres, + dpi, + name="PDFTableExtractor", + ): + """ + Args: + batch_size (An int): How many pages to infer bbox each run + cscdtabnet_config (A PosixPath or str): Config file for cascadetabnet. + Should be placed in config folder + cscdtabnet_ckpt (A PosixPath or str): cascadetabnet checkpoint. 
+ Should be placed + in checkpoint folder + bbox_thres (A float): Threshold to label a bbox as table + dpi (An int): dots per inch for pdf2image + name (A str) + """ + super().__init__(name) + self.batch_size = batch_size + self.cscdtabnet_config = str(cscdtabnet_config) + self.cscdtabnet_ckpt = str(cscdtabnet_ckpt) + self.bbox_thres = bbox_thres + self.dpi = dpi + self.model = self.__create_model() + + def __create_model(self): + """ + Download checkpoint file if not exist and return a detector model + Returns: + an init_detector + """ + ckpt = os.path.basename(self.cscdtabnet_ckpt) + assert ckpt in checkpoint_url.keys(), "Invalid cascadetabnet checkpoint" + + def download_ckpt(): + _ = gdown.download(checkpoint_url[ckpt], output=self.cscdtabnet_ckpt) + + if not os.path.exists(self.cscdtabnet_ckpt): + _logger.info("cascadetabnet checkpoint does not exist. Downloading...") + download_ckpt() + + # In case of connection error and incomplete download + download_successful = False + import torch + + device = "cpu" if "cpu" in torch.__version__ else "cuda:0" + while not download_successful: + try: + det = init_detector( + self.cscdtabnet_config, self.cscdtabnet_ckpt, device=device + ) + download_successful = True + except OSError: + _logger.info( + "Error while downloading cascadetabnet checkpoint. Redownloading..." + ) + download_ckpt() + + return det + + @staticmethod + def process_single_table(pdf_path, prefix, output_folder, dpi, iterable): + """Read a single table mentioned in pdf_path, it is as a standalone + function because of pickle issue + + Args: + pdf_path (str): Path to the pdf + prefix (str): The prefix name for saving the csv + output_folder (str): The output directory to sabe the extracted table + dpi + iterable (list): list of parameters pass by multi processing + iterable[0] (int): page number in the pdf + iterable[1] (int): the index of the tale in the page + iterable[2] (list of int): coordinates of the table. 
+ Return: + table content (dataframe or None) + saved_filenam(str or None): Path the csv is saved + page_num (int): page number + """ + page_num = iterable[0] + table_index = iterable[1] + area = iterable[2] + try: + table = read_pdf( + pdf_path, + pages=page_num, + pandas_options={"header": None}, + stream=True, + silent=True, + area=[i * 72 / dpi for i in area], # tabula uses 72 dpi + ) + except subprocess.CalledProcessError: + _logger.warning( + "Tabula has error extracting table from file {}, page {}, area {}".format( + pdf_path, page_num, area + ) + ) + return None, None, page_num + + if len(table) != 0: + # ** This format is important as curation will use this format ** + saved_filename = "{}_page{}_{}.csv".format( + prefix, page_num, table_index + 1 + ) + filename = os.path.join(output_folder, saved_filename) + + table[0].to_csv(filename) + return table[0], saved_filename, page_num + else: + return None, None, page_num + + def infer_bbox(self, input_filepath): + """ + Infer bbox for 1 file + Args: + input_filepath (A str) + Returns: + table_coords (A dictionary): Key=page number, + value = a list of list of size 4. 
+ [y_top_left, x_top_left, + y_bottom_right, x_bottom_right] + """ + try: + num_pages = pdfinfo_from_path(input_filepath)["Pages"] + except Exception as e: + _logger.warning("{}: Unable to process {}".format(e, input_filepath)) + return None + + pc = 0 + table_coords = defaultdict(list) + + if self.batch_size == -1: + batch_size_ = num_pages + else: + batch_size_ = self.batch_size + + page_num = 1 + pbar = tqdm(total=num_pages + 1, desc="Page") + while pc <= num_pages: + images = convert_from_path( + input_filepath, + first_page=pc + 1, + last_page=pc + batch_size_, + use_pdftocairo=True, + dpi=self.dpi, + thread_count=cpu_count() - 1, + ) + + # infer tables in an image + for im in tqdm( + images, + desc="Inferring tables for page {}-{}".format( + page_num, page_num + batch_size_ + ), + ): + result = inference_detector(self.model, np.array(im)) + bordered_tables = result[0][0] + borderless_tables = result[0][2] + + # could have multiple tables + for res in bordered_tables: + if res[-1] > self.bbox_thres: + # [y_top_left, x_top_left, y_bottom_right, x_bottom_right] + table_coords[page_num].append([res[1], res[0], res[3], res[2]]) + + for res in borderless_tables: + if res[-1] > self.bbox_thres: + # [y_top_left, x_top_left, y_bottom_right, x_bottom_right] + table_coords[page_num].append([res[1], res[0], res[3], res[2]]) + + page_num += 1 + + pc += batch_size_ + pbar.update(batch_size_) + + return table_coords + + def extract_table(self, input_filepath, table_coords, output_folder): + """Given filepath and table coordinates of tables in each page, + extract tables using tabula and save them as csv + Args: + input_filepath (A str or PosixPath) + table_coords (A dictionary): Key=page number, + value = a list of list of size 4. 
+ [y_top_left, x_top_left, + y_bottom_right, x_bottom_right] + output_folder (A str or PosixPath) + + Returns: + tables (A dict): Key=page number, value = a list of dataframes + tables_meta (A dict): Key=page number, value=a list of filenames + """ + prefix = os.path.basename(input_filepath).split(".pdf")[0].strip() + + tables = defaultdict(list) + tables_meta = defaultdict(list) + + # -1 to leave some space for i/o operations + process_count = cpu_count() - 1 + func = partial( + self.process_single_table, input_filepath, prefix, output_folder, self.dpi + ) + with Pool(process_count) as p: + result = p.map( + func, + [ + (page_num, table_index, area) + for page_num in tqdm( + table_coords, desc="Extracting and saving tables" + ) + for table_index, area in enumerate(table_coords[page_num]) + ], + ) + + for tab, path, key in result: + if tab is not None: + tables[key].append(tab) + tables_meta[key].append(path) + + return tables, tables_meta + + def run(self, input_filepath, output_folder): + """Returns and saves tables extracted as csv + + Args: + input_filepath (A str or PosixPath) + output_folder (A str or PosixPath) + + Returns: + tables (A dict): See extract_table() + tables_meta (A dict): See extract_table() + """ + _logger.info("{} is running on file {}...".format(self.name, input_filepath)) + + table_coords = self.infer_bbox(input_filepath) + # unable to process pdf file + if table_coords is None: + return None + + tables, tables_meta = self.extract_table( + input_filepath, table_coords, output_folder + ) + + return (tables, tables_meta) + + def run_folder(self, input_folder, output_folder): + """Runs run() for a folder of pdfs. 
+ + Args: + input_folder (A str or PosixPath) + output_folder (A str or PosixPath) + """ + files = [ + os.path.join(input_folder, f) + for f in os.listdir(input_folder) + if f.endswith(".pdf") + ] + + for f in files: + _ = self.run(f, output_folder) diff --git a/src/components/preprocessing/pdf_text_extractor.py b/src/components/preprocessing/pdf_text_extractor.py new file mode 100755 index 0000000..ec72546 --- /dev/null +++ b/src/components/preprocessing/pdf_text_extractor.py @@ -0,0 +1,180 @@ +import glob +import io +import json +import logging +import os +from pathlib import Path + +import pandas as pd +from pdf2image import pdfinfo_from_path +from pdfminer.converter import TextConverter +from pdfminer.layout import LAParams +from pdfminer.pdfinterp import PDFPageInterpreter +from pdfminer.pdfinterp import PDFResourceManager +from pdfminer.pdfpage import PDFPage + +from .base_component import BaseComponent +from .base_curator import BaseCurator + +_logger = logging.getLogger(__name__) + + +class PDFTextExtractor(BaseComponent): + """This Class is responsible for extracting text data from PDFs and saving + the result in a json format file. + Each name/value pair in the json file refers to page_number and + the list of paragraphs in that page. + Args: + min_paragraph_length (int): Minimum alphabetic characters for paragraph, + any paragraph shorter than that will be disregarded. + annotation_folder (str)(Optional): path to the folder containing all annotated + excel files. If provided, just the pdfs mentioned in annotation excels are + extracted. Otherwise, all the pdfs in the pdf folder will be extracted. + skip_extracted_files (bool): whether to skip extracting a file if it exist in the extraction folder. 
+ name (str) : Name of the component + """ + + def __init__( + self, + annotation_folder=None, + min_paragraph_length=20, + skip_extracted_files=False, + name="PDFTextExtractor", + ): + super().__init__(name) + self.min_paragraph_length = min_paragraph_length + self.annotation_folder = annotation_folder + self.skip_extracted_files = skip_extracted_files + + def process_page(self, input_text): + """This function receives a text following: + 1. Divide it into paragraphs, using \n\n + 2. Remove table data: To achieve this, if number of alphabet characters of paragraph + is less min_paragraph_length, it is considered as table cell and it will be removed. + + Args: + input_text (str): Content of each pdf. + + Returns: + paragraphs (list of str): List of paragraphs. + """ + paragraphs = input_text.split("\n\n") + + # Get ride of table data if the number of alphabets in a paragraph is less than `min_paragraph_length` + paragraphs = [ + BaseCurator.clean_text(p) + for p in paragraphs + if sum(c.isalpha() for c in BaseCurator.clean_text(p)) + > self.min_paragraph_length + ] + return paragraphs + + def extract_pdf_by_page(self, pdf_file): + """Read the content of each page in a pdf file, this method uses pdfminer. + Args: + pdf_file (str): Path to the pdf file. + Returns: + pdf_content (dict): A dictionary with key as page number and values + as list of paragraphs in that page. 
+ """ + try: + num_pages = pdfinfo_from_path(pdf_file) # noqa: F841 + except Exception as e: + _logger.warning("{}: Unable to process {}".format(e, pdf_file)) + return {} + + fp = open(pdf_file, "rb") + rsrcmgr = PDFResourceManager() + retstr = io.BytesIO() + codec = "utf-8" + laparams = LAParams() + device = TextConverter(rsrcmgr, retstr, codec=codec, laparams=laparams) + interpreter = PDFPageInterpreter(rsrcmgr, device) + + pdf_content = {} + for page_number, page in enumerate( + PDFPage.get_pages(fp, check_extractable=False) + ): + interpreter.process_page(page) + data = retstr.getvalue().decode("utf-8") + data_paragraphs = self.process_page(data) + if len(data_paragraphs) == 0: + continue + pdf_content[page_number] = data_paragraphs + retstr.truncate(0) + retstr.seek(0) + fp.close() + + return pdf_content + + def run(self, input_filepath, output_folder): + """Extract text from a single pdf file + Args: + input_filepath (str or PosixPath): full path to the pdf file + output_folder (str or PosixPath): Folder to save the result of extraction + """ + output_file_name = os.path.splitext(os.path.basename(input_filepath))[0] + json_filename = output_file_name + ".json" + + if self.skip_extracted_files and json_filename in os.listdir(output_folder): + _logger.info( + "The extracted json for `{}` already exists. Skipping...".format( + output_file_name + ) + ) + _logger.info( + "If you would like to re-extract the already processed files, set " + "`skip_extracted_files` to False in the config file. 
" + ) + return None + + _logger.info("Extracting {} ...".format(os.path.basename(input_filepath))) + text_dict = self.extract_pdf_by_page(input_filepath) + if text_dict == {}: + return None + + json_path = os.path.join(output_folder, json_filename) + with open(json_path, "w") as f: + json.dump(text_dict, f) + + return text_dict + + def run_folder(self, input_folder, output_folder): + """This method will perform pdf extraction for all the pdfs mentioned + as source in the annotated excel files + and it will be saved the results in a output_folder. + + Args: + input_folder (str or PosixPath): Path to the folder containing + all the received pdf files. + output_folder (str or PosixPath): path to the folder to save the + extracted json files. + """ + files = [str(f) for f in Path(input_folder).rglob("*.pdf") if f.is_file()] + print(files) + if self.annotation_folder is not None: + # Get the names of all excel files + all_annotation_files = glob.glob( + "{}/[!~$]*[.xlsx]".format(self.annotation_folder) + ) + annotated_pdfs = [] + for excel_path in all_annotation_files: + df = pd.read_excel(excel_path, sheet_name="data_ex_in_xls") + # Get the unique values of source_file column + df_unique_pdfs = df["source_file"].drop_duplicates().dropna() + annotated_pdfs.extend(df_unique_pdfs) + annotated_pdfs = [file.split(".pdf")[0] + ".pdf" for file in annotated_pdfs] + found_annotated_pdfs = [] + + for f in files: + if os.path.basename(f) in annotated_pdfs: + found_annotated_pdfs.append(os.path.basename(f)) + _ = self.run(f, output_folder) + _logger.info( + "The following files in the annotation excels do not exist in pdf folder\n" + ) + _logger.info(set(annotated_pdfs).difference(set(found_annotated_pdfs))) + + else: + for f in files: + _ = self.run(f, output_folder) diff --git a/src/components/preprocessing/table_curator.py b/src/components/preprocessing/table_curator.py new file mode 100755 index 0000000..13a4392 --- /dev/null +++ b/src/components/preprocessing/table_curator.py 
def __init__(
    self,
    neg_pos_ratio,
    columns_to_read,
    company_to_exclude,
    seed=42,
    create_neg_samples=False,
    name="DataTableCurator",
    data_type="TABLE",
):
    """Set up a curator that builds the ESG table dataset from annotations.

    Args:
        neg_pos_ratio (int): Number of negative samples to create per
            positive sample (e.g. 2 means roughly two negatives for each
            positive).
        columns_to_read (A list of str): Columns to read from excels
        company_to_exclude (A list of str): Companies to exclude
        seed (int): Seed given to the global ``random`` generator.
        create_neg_samples (bool): Create negative samples
        name (str) : Name of the component
        data_type (str): Value of the ``data_type`` column to keep.
    """
    super().__init__(name)

    # Seed the module-level RNG that the negative sampling draws from.
    random.seed(seed)

    self.data_type = data_type
    self.columns_to_read = columns_to_read
    self.company_to_exclude = company_to_exclude
    self.create_neg_samples = create_neg_samples
    self.neg_pos_ratio = neg_pos_ratio
def create_negative_examples(self, row, pos_filename, tables_samepdf):
    """Build negative (label 0) examples for one annotation row.

    Negative tables are taken from the same pdf first; if that pdf holds
    fewer than ``self.neg_pos_ratio`` other tables, the remainder is drawn
    from tables of other pdfs. When not enough tables exist overall, as
    many negatives as are available are returned instead of raising.

    Args:
        row (A pandas.Series): Must provide "company", "year", "question".
        pos_filename (A str): File name of positive table
        tables_samepdf (A dict): Key= Page number (A str), value = A list of
            table csv paths

    Returns:
        examples (A list of lists or empty list):
            [[str, int, str, None, str, int],...]
    """
    company = row["company"]
    year = row["year"]
    question = row["question"]
    label = 0

    negative_files_samepdf = [
        table
        for page_tables in tables_samepdf.values()
        for table in page_tables
        if table != pos_filename
    ]

    if self.neg_pos_ratio > len(negative_files_samepdf):
        # Not enough tables in this pdf: top up from the other pdfs.
        same_pdf = set(negative_files_samepdf)
        negative_files_diffpdf = [
            table
            for table in self.filename_to_stringarr
            if table != pos_filename and table not in same_pdf
        ]
        missing = self.neg_pos_ratio - len(negative_files_samepdf)
        # random.sample raises ValueError when asked for more items than the
        # population holds, so cap the request at what is available.
        extra_neg = random.sample(
            negative_files_diffpdf, min(missing, len(negative_files_diffpdf))
        )
        neg = negative_files_samepdf + extra_neg
    else:
        neg = random.sample(negative_files_samepdf, self.neg_pos_ratio)

    return [[company, year, question, None, nf, label] for nf in neg]
def __clean_annotation_file(self, df, annotation_filepath):
    """Return a cleaned copy of one annotation sheet.

    Steps, in order:
      1. keep ``self.columns_to_read`` and drop rows that are entirely NaN
         or have NaN in company / source_file / source_page / kpi_id / year;
      2. keep rows whose data_type equals ``self.data_type`` and whose
         company is not in ``self.company_to_exclude``;
      3. normalise ``source_file`` so that it ends in exactly one ".pdf";
      4. map ``kpi_id`` to ``question`` and drop rows with an unknown kpi;
      5. parse ``source_page`` ("[1, 02]") into a list of str (["1", "2"])
         and drop rows that cannot be parsed;
      6. drop rows whose data_type is not listed for the kpi in
         ``KPI_CATEGORY``;
      7. add an ``annotator`` column holding the excel file name.

    Args:
        df (A dataframe)
        annotation_filepath (A str or PosixPath)

    Returns:
        (A dataframe): the cleaned rows with a fresh 0..n-1 index.
    """
    required = ["company", "source_file", "source_page", "kpi_id", "year"]
    df = (
        df[self.columns_to_read]
        .dropna(axis=0, how="all", subset=self.columns_to_read)
        .dropna(axis=0, how="any", subset=required)
        .reset_index(drop=True)
    )

    # Filter dataframe to rows of the wanted data type and exclude companies
    keep = df.data_type == self.data_type
    for exclude in self.company_to_exclude:
        keep = keep & (df.company != exclude)
    # Copy so the column assignments below act on an independent frame
    # rather than on a slice of the unfiltered one.
    df = df[keep].copy()

    def get_pdf_name_right(f):
        # Strip first, so "report.pdf " is recognised as already having the
        # extension instead of becoming "report.pdf.pdf".
        name = str(f).strip()
        for ending in (".pdf", ",pdf"):
            if name.endswith(ending):
                return name.split(ending)[0].strip() + ".pdf"
        return name + ".pdf"

    df["source_file"] = df["source_file"].apply(get_pdf_name_right)

    def map_kpi(r):
        try:
            return KPI_MAPPING[float(r)]
        except (KeyError, ValueError, TypeError):
            # Unknown id, or a cell that is not a number at all.
            return None

    df["question"] = df["kpi_id"].apply(map_kpi)
    invalid_kpi = df[df["question"].isna()]["kpi_id"].unique().tolist()
    if len(invalid_kpi) != 0:
        logger.warning(
            "File {} has invalid kpis: {}".format(
                os.path.basename(annotation_filepath), invalid_kpi
            )
        )

    # Remove examples with invalid kpi
    df = df.dropna(axis=0, subset=["question"]).reset_index(drop=True)

    def clean_page(sp):
        # Only a bracketed string such as "[3]" or "[3, 04]" is valid; any
        # other cell (a bare number, empty brackets, text) is reported as
        # invalid instead of aborting the whole file.
        if not isinstance(sp, str) or len(sp) < 2:
            return None
        if sp[0] != "[" or sp[-1] != "]":
            return None
        try:
            # int() round-trip covers multi pages and fixes cases like '02'
            return [str(int(i)) for i in sp[1:-1].split(",")]
        except ValueError:
            return None

    temp = df["source_page"].apply(clean_page)
    invalid_source_page = df["source_page"][temp.isna()].unique().tolist()
    if len(invalid_source_page) != 0:
        logger.warning(
            "File {} has invalid source_page format: {}".format(
                os.path.basename(annotation_filepath), invalid_source_page
            )
        )

    df["source_page"] = temp
    df = df.dropna(axis=0, subset=["source_page"]).reset_index(drop=True)

    # Remove examples with incorrect kpi-data_type pair. Built as an explicit
    # boolean Series so an empty frame yields an empty mask, and .get() so a
    # kpi without a category entry is dropped rather than raising KeyError.
    matches_category = pd.Series(
        [
            data_type in KPI_CATEGORY.get(float(kpi_id), ())
            for kpi_id, data_type in zip(df["kpi_id"], df["data_type"])
        ],
        index=df.index,
        dtype=bool,
    )
    rows_before = df.shape[0]
    df = df[matches_category].reset_index(drop=True)
    diff = rows_before - df.shape[0]
    if diff > 0:
        logger.info(
            "Drop {} examples for {} due to incorrect kpi-data_type pair".format(
                diff, annotation_filepath
            )
        )

    df["annotator"] = os.path.basename(annotation_filepath)
    return df
def process_single_annotation_file(
    self, annotation_filepath, sheet_name="data_ex_in_xls"
):
    """Create examples for a single excel file

    Args:
        annotation_filepath (str): Path to the annotated excel file
        sheet_name (A str): Sheet which contains data
    Returns:
        examples (list of lists): List of positive and negative examples
            extracted from excel file. Empty when the file cannot be read,
            lacks one of ``self.columns_to_read``, or yields no example.
    """
    logger.debug("Processing excel file {}".format(annotation_filepath))

    # Excel file corrupted
    try:
        df = pd.read_excel(annotation_filepath, sheet_name=sheet_name)
    except xlrd.biffh.XLRDError as err:
        logger.warning(
            "Trouble reading excel file {}: {}".format(annotation_filepath, err)
        )
        # An empty list, not [[]]: the caller extend()s its example list
        # with this value, so [[]] would add one empty example row.
        return []

    # Check if df has all columns
    if any(e not in df.columns for e in self.columns_to_read):
        logger.warning(
            "Excel file {} has missing columns from {}".format(
                annotation_filepath, self.columns_to_read
            )
        )
        return []

    # clean dataframe
    df = self.__clean_annotation_file(df, annotation_filepath)

    # table_meta contains {pdf_name:{page: list of table csvs, ...}, ...}
    table_meta = self.__create_table_meta()

    examples = []
    for _, row in df.iterrows():
        # .get() so that looking up an unknown pdf does not insert an empty
        # entry into the defaultdict.
        tables_samepdf = table_meta.get(row["source_file"], {})

        # skip curation process if pdf does not exist
        if len(tables_samepdf) == 0:
            logger.warning("{} was not extracted.".format(row["source_file"]))
            continue

        positive_example = self.create_pos_examples(row.copy(), tables_samepdf)

        # It will be empty if no table found in the page
        if not positive_example:
            continue

        if self.create_neg_samples:
            # Column 4 of an example is the table file name.
            pos_filename = positive_example[0][4]
            negative_examples = self.create_negative_examples(
                row.copy(), pos_filename, tables_samepdf
            )
            examples.extend(negative_examples + positive_example)
        else:
            examples.extend(positive_example)

    return examples
def run(self, extraction_folder, annotation_excels, output_folder):
    """This is the main method for creating ESG text dataset.

    Collects the examples of every annotation excel, maps each kpi_id to
    its question, drops unmapped and duplicate examples and writes the
    result to ``esg_<data_type>_dataset.csv`` in ``output_folder``. Nothing
    is written when no example could be curated.

    Args:
        extraction_folder (str): Path to the extraction folder. In the
            extraction phase pdf are read and saved as json files.
        annotation_excels (A list of str): Paths to excel files
        output_folder (str) : Output folder to save the curated dataset.
    """
    # TODO: Move us to init
    self.extraction_folder = extraction_folder
    self.output_folder = output_folder
    self.annotation_excels = annotation_excels

    examples_list = []
    for excel_file in annotation_excels:
        examples_list.extend(self.process_single_annotation_file(excel_file))

    if not examples_list:
        # An empty frame has no "Index"/"kpi_id"/"context" columns, so the
        # steps below would fail with a KeyError.
        logger.warning(
            "No {} examples could be curated from the given annotation "
            "files".format(self.data_type)
        )
        return

    df_result = pd.DataFrame(examples_list).reset_index(drop=True)
    # Drop the unnecessary column.
    df_result.drop(["Index"], axis=1, inplace=True)

    # Map the KPI to KPI questions. The module is reloaded first because it
    # reads the mapping csv at import time.
    importlib.reload(kpi_mapping)

    df_result["question"] = df_result.astype({"kpi_id": "float"}, errors="ignore")[
        "kpi_id"
    ].map(kpi_mapping.KPI_MAPPING)

    # In the result csv, the following KPIs are not mapped to any questions.
    # To avoid losing any data, they should be fixed manually in the excels.
    unmapped = df_result[df_result["question"].isna()]["kpi_id"].unique()
    if len(unmapped) != 0:
        logger.warning(
            "The corresponding KPIs can not be mapped to any questions "
            "and the mapped question is empty\n{}".format(unmapped)
        )

    # Remove the rows could not map KPI to question
    df_result = df_result[df_result.question.notnull()]
    # Remove duplicate examples
    df_result = df_result.groupby(["question", "context"]).first().reset_index()

    save_path = os.path.join(
        output_folder, "esg_{}_dataset.csv".format(self.data_type)
    )
    logger.info("Curated {} examples".format(len(df_result)))
    logger.info("Saving the dataset in {}".format(save_path))
    df_result.to_csv(save_path)
def create_negative_examples(self, row):
    """Create negative examples for each row, to achieve this:
    - If the source pdf is presented and extracted, we choose a random page,
      except source page and choose a random paragraph within that.
    - If the extracted pdf is not available, we look for the a random
      extracted pdf and choose a random paragraph inside that.

    Pages are drawn from index 3 up to the last page; a paragraph is
    accepted when its cleaned text has at least
    ``self.min_length_neg_sample`` characters.

    Args:
        row (pandas.core.series.Series): each row of pandas data frame
    Return:
        neg_rows (list of pandas.core.series.Series): A list of negative
            examples, each row has two more members, context and label
            of 0. ``None`` when no negative example can be created (no
            extracted pdf at all, unparsable source_page for an extracted
            pdf, fewer than four pages, or no acceptable paragraph).
    """
    pdf_content = self.load_pdf_content(row)
    own_pdf_found = len(pdf_content) != 0

    # if the corresponding pdf to a row is not presented, a random pdf is
    # picked to create negative example
    if not own_pdf_found:
        json_paths = list(Path(self.extraction_folder).rglob("*.json"))
        if not json_paths:
            return None
        # rglob already yields paths that include extraction_folder, so the
        # path is opened as is (joining it again duplicated the folder for
        # relative extraction folders).
        random_json_path = random.choice(json_paths)
        with open(random_json_path) as f:
            pdf_content = [json.load(f)]

    try:
        # Extracted pages are 0-based, annotated pages are 1-based.
        selected_pages = [p - 1 for p in ast.literal_eval(row["source_page"])]
    except (SyntaxError, ValueError, TypeError):
        # literal_eval raises ValueError for non-literal input (e.g. NaN);
        # TypeError covers a literal that is not a list of numbers.
        if own_pdf_found:
            return None
        selected_pages = []

    pages = pdf_content[0]
    last_page = len(pages) - 1
    if last_page < 3:
        return None

    def is_usable(paragraph):
        return len(self.clean_text(paragraph)) >= self.min_length_neg_sample

    # Make sure the rejection sampling below can terminate: at least one
    # non-source page must hold an acceptable paragraph.
    if not any(
        page not in selected_pages
        and any(is_usable(par) for par in pages.get(str(page), []))
        for page in range(3, last_page + 1)
    ):
        return None

    neg_rows = []
    for _ in range(int(self.neg_pos_ratio)):
        while True:
            negative_page = random.randint(3, last_page)
            if negative_page in selected_pages:
                continue
            negative_page_content = pages.get(str(negative_page), [])
            if len(negative_page_content) == 0:
                continue
            negative_context = self.clean_text(random.choice(negative_page_content))
            if len(negative_context) < self.min_length_neg_sample:
                continue
            break

        # Before assigning value, create a copy of it
        row_copy = row.copy()
        row_copy["context"] = negative_context
        row_copy["label"] = 0
        neg_rows.append(row_copy)

    return neg_rows
def get_full_paragraph(self, row, relevant_sentences):
    """Find the full paragraphs that contain the annotated sentences.

    The extracted content of the pdf named in the row is loaded, the
    paragraphs of the pages listed in ``source_page`` are collected, and
    for each relevant sentence the first paragraph containing it (literal,
    case-insensitive match on the cleaned text) is returned.

    Note: The result can be an empty list if the paragraph can not
    retrieved.

    Args:
        row (pandas.core.series.Series): Each row of pandas dataframe.
        relevant_sentences (list of str): List of processed
            relevant_paragraphs.
    Returns:
        matches_list (list of str): list of full paragraphs.
    """
    pdf_content = self.load_pdf_content(row)
    try:
        source_page = ast.literal_eval(row["source_page"])
        # pdfminer starts the page counter as 0 while for pdf viewers the
        # first page is numbered as 1.
        selected_pages = [p - 1 for p in source_page]
    except (SyntaxError, ValueError, TypeError):
        # ValueError: not a Python literal; TypeError: not a list of numbers.
        logger.info(
            "Can not process source page in row {} of {} ".format(
                (row["Index"] + 2), row["annotator"]
            )
        )
        return []

    # Clean every candidate paragraph once, not once per sentence.
    cleaned_paragraphs = [
        self.clean_text(par)
        for p in selected_pages
        for pdf in pdf_content
        for par in pdf.get(str(p), [])
    ]

    matches_list = []
    for sentence in relevant_sentences:
        # re.escape makes every character literal, including "." and other
        # metacharacters the previous hand-written escape list left out.
        pattern = re.compile(re.escape(str(sentence)), re.I)
        for single_par_clean in cleaned_paragraphs:
            if pattern.search(single_par_clean) is not None:
                matches_list.append(single_par_clean)
                break

    return matches_list
+ extracted_filename = ( + os.path.splitext(str(row["source_file"]))[0] + "-" + str(row["company"]) + ) + # Get all the files in extraction folder that has the desired name + extracted_paths = [ + path + for path in os.listdir(self.extraction_folder) + if extracted_filename in path + ] + + pdf_contents = [] + for path in extracted_paths: + with open(os.path.join(self.extraction_folder, path)) as f: + pdf_contents.append(json.load(f)) + return pdf_contents + # TODO: Support cases where the source pdf exists in the pdf_folder but it is not extracted. + # else: + # # Look for the pdf name in the pdf folders that are the same as source column. + # source_pdf_path = self.get_path_pdf(config.PDF_FOLDER, row.source_file) + # if source_pdf_path is None: + # logger.info("The related mentioned pdf {} in {} not found, and the extracted not found" + # .format(row.annotator, row.source)) + # return None + # # Get the content for all files named as source file name in annotations. + # pdf_content = [PDFTextExtractor.extract_pdf_by_page(path) for path in source_pdf_path] + # return pdf_content diff --git a/src/components/utils/__init__.py b/src/components/utils/__init__.py new file mode 100755 index 0000000..e69de29 diff --git a/src/components/utils/cscdtabnet_checkpoint_url.py b/src/components/utils/cscdtabnet_checkpoint_url.py new file mode 100755 index 0000000..ac6cc26 --- /dev/null +++ b/src/components/utils/cscdtabnet_checkpoint_url.py @@ -0,0 +1,10 @@ +checkpoint_url = { + "general_model.pth": "https://drive.google.com/uc?id=1-xfq5hDmFdKgbY9FSFTmhSlcb2p13RPn", + "icdar_13.pth": "https://drive.google.com/uc?id=1-mVr4UBicFk3mjUz5tsVPjQ4jzRtiT7V", + "icdar_19A.pth": "https://drive.google.com/uc?id=1vfUr4pmmI4GICZubAnBeFU8pviMUW_c9", + "tablebank_word.pth": "https://drive.google.com/uc?id=1-ZnV84t61IrkAfQH7dOATpo_T4C1J4Qa", + "tablebank_latex.pth": "https://drive.google.com/uc?id=1-9EzU_LfD6fE8iJFjOZ3nBsCObqhpNUa", + "tablebank_both.pth": 
def get_text_section(doc_tokens):
    """Return the words ``[start:end]`` of a space separated document.

    ``doc_tokens`` is indexed as ``(text, start, end)``: the text is split
    on single spaces and the selected words are joined back with a space.
    """
    document = doc_tokens[0]
    start = doc_tokens[1]
    end = doc_tokens[2]
    words = document.split(" ")
    return " ".join(words[start:end])