diff --git a/research/.gitignore b/research/.gitignore index 934305f7..3cdaa558 100644 --- a/research/.gitignore +++ b/research/.gitignore @@ -1,3 +1,4 @@ comprehensiondatas/ asap-aes/ feedback-prize-2021/ +pretrained/ diff --git a/research/Data Augmentation with NLP.ipynb b/research/Data Augmentation with NLP.ipynb new file mode 100644 index 00000000..c7ee44ed --- /dev/null +++ b/research/Data Augmentation with NLP.ipynb @@ -0,0 +1,405 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 10, + "id": "5198b5db", + "metadata": { + "ExecuteTime": { + "end_time": "2022-02-21T11:09:49.000368Z", + "start_time": "2022-02-21T11:09:48.991377Z" + } + }, + "outputs": [], + "source": [ + "import nlpaug.augmenter.char as nac\n", + "import nlpaug.augmenter.word as naw\n", + "import nlpaug.augmenter.sentence as nas\n", + "import nlpaug.flow as nafc\n", + "import nlpaug\n", + "\n", + "from nlpaug.util import Action\n", + "\n", + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "ef52b23c", + "metadata": { + "ExecuteTime": { + "end_time": "2022-02-21T10:51:13.388707Z", + "start_time": "2022-02-21T10:51:13.304667Z" + } + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | text | \n", + "label | \n", + "score | \n", + "start | \n", + "end | \n", + "source | \n", + "
---|---|---|---|---|---|---|
0 | \n", + "In 2019 a wave of anti-abortion laws swept thi... | \n", + "Evidence | \n", + "0.983720 | \n", + "0 | \n", + "528 | \n", + "abortion-florida-15-week-ban | \n", + "
1 | \n", + "Though most of these laws were quickly blocked... | \n", + "Evidence | \n", + "0.934319 | \n", + "528 | \n", + "908 | \n", + "abortion-florida-15-week-ban | \n", + "
2 | \n", + "Three years later, American reproductive right... | \n", + "Evidence | \n", + "0.622358 | \n", + "908 | \n", + "1214 | \n", + "abortion-florida-15-week-ban | \n", + "
3 | \n", + "It might seem curious, then, that legislators ... | \n", + "Evidence | \n", + "0.946866 | \n", + "1214 | \n", + "1722 | \n", + "abortion-florida-15-week-ban | \n", + "
4 | \n", + "One of this year’s unmistakable trends in anti... | \n", + "Evidence | \n", + "0.991869 | \n", + "1722 | \n", + "2394 | \n", + "abortion-florida-15-week-ban | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
3893 | \n", + "And boy did it come | \n", + "Claim | \n", + "0.982928 | \n", + "2554 | \n", + "2573 | \n", + "yosemite-falls | \n", + "
3894 | \n", + "But the record rains will not end California’s... | \n", + "Rebuttal | \n", + "0.880377 | \n", + "2573 | \n", + "2636 | \n", + "yosemite-falls | \n", + "
3895 | \n", + "Last week, Gov. Gavin Newsom extended the stat... | \n", + "Claim | \n", + "0.541481 | \n", + "2636 | \n", + "2769 | \n", + "yosemite-falls | \n", + "
3896 | \n", + "This has been California’s second driest year ... | \n", + "Evidence | \n", + "0.479049 | \n", + "2769 | \n", + "2925 | \n", + "yosemite-falls | \n", + "
3897 | \n", + "Severe drought conditions, worsened by climate... | \n", + "Claim | \n", + "0.478424 | \n", + "2925 | \n", + "3080 | \n", + "yosemite-falls | \n", + "
3898 rows × 6 columns
\n", + "\n", + " | text | \n", + "label | \n", + "score | \n", + "start | \n", + "end | \n", + "source | \n", + "
---|---|---|---|---|---|---|
0 | \n", + "In 2019 a wave of anti-abortion laws swept thi... | \n", + "Evidence | \n", + "0.983720 | \n", + "0 | \n", + "528 | \n", + "abortion-florida-15-week-ban | \n", + "
1 | \n", + "Though most of these laws were quickly blocked... | \n", + "Evidence | \n", + "0.934319 | \n", + "528 | \n", + "908 | \n", + "abortion-florida-15-week-ban | \n", + "
2 | \n", + "Three years later, American reproductive right... | \n", + "Evidence | \n", + "0.622358 | \n", + "908 | \n", + "1214 | \n", + "abortion-florida-15-week-ban | \n", + "
3 | \n", + "It might seem curious, then, that legislators ... | \n", + "Evidence | \n", + "0.946866 | \n", + "1214 | \n", + "1722 | \n", + "abortion-florida-15-week-ban | \n", + "
4 | \n", + "One of this year’s unmistakable trends in anti... | \n", + "Evidence | \n", + "0.991869 | \n", + "1722 | \n", + "2394 | \n", + "abortion-florida-15-week-ban | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
3893 | \n", + "And boy did it come | \n", + "Claim | \n", + "0.982928 | \n", + "2554 | \n", + "2573 | \n", + "yosemite-falls | \n", + "
3894 | \n", + "But the record rains will not end California’s... | \n", + "Rebuttal | \n", + "0.880377 | \n", + "2573 | \n", + "2636 | \n", + "yosemite-falls | \n", + "
3895 | \n", + "Last week, Gov. Gavin Newsom extended the stat... | \n", + "Claim | \n", + "0.541481 | \n", + "2636 | \n", + "2769 | \n", + "yosemite-falls | \n", + "
3896 | \n", + "This has been California’s second driest year ... | \n", + "Evidence | \n", + "0.479049 | \n", + "2769 | \n", + "2925 | \n", + "yosemite-falls | \n", + "
3897 | \n", + "Severe drought conditions, worsened by climate... | \n", + "Claim | \n", + "0.478424 | \n", + "2925 | \n", + "3080 | \n", + "yosemite-falls | \n", + "
3898 rows × 6 columns
\n", + "\n", + " | textualScore | \n", + "
---|---|
0 | \n", + "0.813205 | \n", + "
1 | \n", + "0.685687 | \n", + "
2 | \n", + "0.809620 | \n", + "
3 | \n", + "0.800835 | \n", + "
4 | \n", + "0.731424 | \n", + "
... | \n", + "... | \n", + "
154 | \n", + "0.772159 | \n", + "
155 | \n", + "0.844647 | \n", + "
156 | \n", + "0.714356 | \n", + "
157 | \n", + "0.670670 | \n", + "
158 | \n", + "0.797801 | \n", + "
159 rows × 1 columns
\n", + "\n", - " | label | \n", - "text | \n", - "is_valid | \n", - "
---|---|---|---|
0 | \n", - "negative | \n", - "Un-bleeping-believable! Meg Ryan doesn't even look her usual pert lovable self in this, which normally makes me forgive her shallow ticky acting schtick. Hard to believe she was the producer on this dog. Plus Kevin Kline: what kind of suicide trip has his career been on? Whoosh... Banzai!!! Finally this was directed by the guy who did Big Chill? Must be a replay of Jonestown - hollywood style. Wooofff! | \n", - "False | \n", - "
1 | \n", - "positive | \n", - "This is a extremely well-made film. The acting, script and camera-work are all first-rate. The music is good, too, though it is mostly early in the film, when things are still relatively cheery. There are no really superstars in the cast, though several faces will be familiar. The entire cast does an excellent job with the script.<br /><br />But it is hard to watch, because there is no good end to a situation like the one presented. It is now fashionable to blame the British for setting Hindus and Muslims against each other, and then cruelly separating them into two countries. There is som... | \n", - "False | \n", - "
2 | \n", - "negative | \n", - "Every once in a long while a movie will come along that will be so awful that I feel compelled to warn people. If I labor all my days and I can save but one soul from watching this movie, how great will be my joy.<br /><br />Where to begin my discussion of pain. For starters, there was a musical montage every five minutes. There was no character development. Every character was a stereotype. We had swearing guy, fat guy who eats donuts, goofy foreign guy, etc. The script felt as if it were being written as the movie was being shot. The production value was so incredibly low that it felt li... | \n", - "False | \n", - "
3 | \n", - "positive | \n", - "Name just says it all. I watched this movie with my dad when it came out and having served in Korea he had great admiration for the man. The disappointing thing about this film is that it only concentrate on a short period of the man's life - interestingly enough the man's entire life would have made such an epic bio-pic that it is staggering to imagine the cost for production.<br /><br />Some posters elude to the flawed characteristics about the man, which are cheap shots. The theme of the movie \"Duty, Honor, Country\" are not just mere words blathered from the lips of a high-brassed offic... | \n", - "False | \n", - "
4 | \n", - "negative | \n", - "This movie succeeds at being one of the most unique movies you've seen. However this comes from the fact that you can't make heads or tails of this mess. It almost seems as a series of challenges set up to determine whether or not you are willing to walk out of the movie and give up the money you just paid. If you don't want to feel slighted you'll sit through this horrible film and develop a real sense of pity for the actors involved, they've all seen better days, but then you realize they actually got paid quite a bit of money to do this and you'll lose pity for them just like you've alr... | \n", - "False | \n", - "
... | \n", - "... | \n", - "... | \n", - "... | \n", - "
995 | \n", - "negative | \n", - "There are many different versions of this one floating around, so make sure you can locate one of the unrated copies, otherwise some gore and one scene of nudity might be missing. Some versions also omit most of the opening sequence and other bits here and there. The cut I saw has the on-screen title WITCHCRAFT: EVIL ENCOUNTERS and was released by Shriek Show, who maintain the original US release title WITCHERY for the DVD release. It's a nice-looking print and seems to have all of the footage, but has some cropping/aspect ratio issues. In Italy, it was released as LA CASA 4 (WITCHCRAFT). ... | \n", - "True | \n", - "
996 | \n", - "positive | \n", - "Once upon a time Hollywood produced live-action, G-rated movies without foul language, immorality, and gore-splattered violence. These movies neither insulted your intelligence no manipulated your emotions. The heroes differed little from the crowd. They shared the same feelings and bore the same burdens. Since the 1970s, the film industry has pretty much written off G-rated movies for adults. Basically, modern mature audiences demand large doses of embellished realism for their cinematic diet, laced heavily with vile profanity, mattress-thumping sex, and knuckle-bruising fisticuffs. These... | \n", - "True | \n", - "
997 | \n", - "negative | \n", - "Wenders was great with Million $ Hotel.I don't know how he came up with this film! The idea of giving the situation after spt11 and the view of American Society is hopeful,that makes it 2 out of ten.But this is not a movie.Is that the best someone can do with a great idea(the west-east clash).There are important things going on in middle east and it is just issued on the screen of a MAC* with the fingers of an Amerian girl who is actually at the level of stupidity(because she is just ignorant about the facts).The characters are not well shaped.And the most important thing is the idea that ... | \n", - "True | \n", - "
998 | \n", - "negative | \n", - "Although a film with Bruce Willis is always worth watching, you better skip this one. I watched this one on television, so I didn't have to plunk down cash for it. Lucky me.<br /><br />The plot develops slowly, very slowly. Although the first 30 minutes or so are quite believable, it gets more and more unbelievable towards the end. It is highly questionable, if a seasoned soldier like Lt. Waters would disobey direct orders. And even if he would, if the rest of his platoon would. They know he puts them in direct danger, and they know they will certainly die if they follow him, but what the ... | \n", - "True | \n", - "
999 | \n", - "positive | \n", - "A compelling, honest, daring, and unforgettable psychological horror film that touches on the painful experiences of pain caused by rape - \"Descent\" is a film that went under-the-radar due to its lack of distribution because, frankly, the film is so brutal in its depictions, that if it had been released theatrically, it may have met itself to some strong biased hate.<br /><br />The film deserves to be discovered for, not only its dark themes, and not only for its amazing direction and authentic style - but most of all for its performances. Chad Faust is absolutely stunning, bringing enough... | \n", - "True | \n", - "
1000 rows × 3 columns
\n", - "144293 rows × 9 columns
\n", + "3898 rows × 6 columns
\n", "" ], "text/plain": [ - " id discourse_id discourse_start discourse_end \\\n", - "0 423A1CA112E2 1.622628e+12 8.0 229.0 \n", - "1 423A1CA112E2 1.622628e+12 230.0 312.0 \n", - "2 423A1CA112E2 1.622628e+12 313.0 401.0 \n", - "3 423A1CA112E2 1.622628e+12 402.0 758.0 \n", - "4 423A1CA112E2 1.622628e+12 759.0 886.0 \n", - "... ... ... ... ... \n", - "144288 4C471936CD75 1.618153e+12 2234.0 3203.0 \n", - "144289 4C471936CD75 1.618153e+12 3221.0 4509.0 \n", - "144290 4C471936CD75 1.618025e+12 4510.0 4570.0 \n", - "144291 4C471936CD75 1.618025e+12 4570.0 4922.0 \n", - "144292 4C471936CD75 1.618025e+12 4935.0 5825.0 \n", - "\n", - " text \\\n", - "0 Modern humans today are always on their phone. They are always on their phone more than 5 hours a day no stop .All they do is text back and forward and just have group Chats on social media. They even do it while driving. \n", - "1 They are some really bad consequences when stuff happens when it comes to a phone. \n", - "2 Some certain areas in the United States ban phones from class rooms just because of it. \n", - "3 When people have phones, they know about certain apps that they have .Apps like Facebook Twitter Instagram and Snapchat. So like if a friend moves away and you want to be in contact you can still be in contact by posting videos or text messages. People always have different ways how to communicate with a phone. Phones have changed due to our generation. \n", - "4 Driving is one of the way how to get around. People always be on their phones while doing it. Which can cause serious Problems. \n", - "... ... \n", - "144288 if I'm not sure what college I want to attend, and I ask one friend where I should go, they might say \"George Mason\" as a suggestion. But if George Mason is not in fact the best college for me, even though the person I asked was trying to help, that one opinion could sway me to go there anyway and not have the best experience. But yet if I go to ten people to advice, including the person who suggested George Mason, they might be the only one who would say that and maybe five of the other people I asked might say Virginia Tech, and I would decide to go to Virginia Tech instead of to George... \n", - "144289 seeking multiple opinions before making a hard decision can be beneficial because of the reasons stated above. When I was in second grade, I passed the test to be admitted into the AAP (Advanced Academics Program) in my school. My best friend was also accepted, and wanted me to go to AAP with her, but I didnt really want to go into AAP. I told my parents this, and they agreed it would be best for me to stay in the normal class for on more year. Since I got my parents' opinions, I also felt more secure staying out of the advanced program even though my friend wanted me to do the opposite a... \n", - "144290 it is better to seek multiple opinions instead of just one. \n", - "144291 The impact of asking people to help you make a decision can be big, like a country deciding to go to war, or small, like a third grader choosing if they want to go into the advanced program in school, but nonetheless, asking for other people's opinions instead of just one person's opinion can make a difference in someone's life, whether big or small. \n", - "144292 there are many other reasons one might want to seek multiple opinions and pieces of advice instead of just one, but these are the two main ones that I think really make it worthwhile to ask for advice from multiple people instead of making decisions with only one piece of advice from one person. The key thing that all of these examples have shown is that it is better to seek multiple opinions from multiple different people than to only get advice from one. This is ultimately because asking multiple people for advice makes you feel better about the decisions you make and also increases the ... \n", + " text \\\n", + "0 In 2019 a wave of anti-abortion laws swept this country — a common enough event in the United States, where hundreds of such laws have passed during the last decade. But these grabbed the public’s attention in a way many others hadn’t. Georgia banned abortion after about six weeks of pregnancy, or about two weeks after a missed menstrual period. Ohio, Mississippi, Louisiana and Kentucky did the same, while Missouri banned the procedure at eight weeks. Alabama went the furthest, banning virtually all abortions in the state. \n", + "1 Though most of these laws were quickly blocked by the courts — they were obviously unconstitutional under Roe v. Wade — the backlash to their passing was intense, especially in Georgia, a major hub of film and television production. Boycotts were threatened. Netflix and Disney spoke out. The actress Alyssa Milano even tried to get a “Lysistrata”-style sex strike off the ground. \n", + "2 Three years later, American reproductive rights are on an even bleaker trajectory. A Supreme Court decision that’s expected to come down this summer is likely to strike down Roe v. Wade, either in deed or in word, making it possible for states with anti-abortion leadership to ban the procedure altogether. \n", + "3 It might seem curious, then, that legislators in some conservative-leaning states are spending these months before the likely downfall of Roe working to pass less extreme abortion measures than they did in 2019. Now seems like the time for anti-abortion legislators to go for broke. The fact that some of them are pursuing a different strategy offers clues about what a post-Roe America could look like, and how that landscape could be more complex — and less predetermined — than some Americans had assumed. \n", + "4 One of this year’s unmistakable trends in anti-abortion legislation is the 15-week ban. Legislators in Arizona, Florida and West Virginia are now considering bills — which, as the name suggests, would ban abortion after 15 weeks of pregnancy, in violation of Roe. At first blush, it might seem these states are simply copying the Mississippi law that the Supreme Court seems likely to uphold this summer, in Dobbs v. Jackson Women’s Health Organization. But why would they hold back now, rather than try to get more draconian legislation through their legislatures? Florida even considered a six-... \n", + "... ... \n", + "3893 And boy did it come \n", + "3894 But the record rains will not end California’s ongoing drought. \n", + "3895 Last week, Gov. Gavin Newsom extended the state’s drought emergency and asked residents to redouble their water conservation efforts. \n", + "3896 This has been California’s second driest year on record, with near-record low storage in the state’s largest reservoirs, according to the governor’s office. \n", + "3897 Severe drought conditions, worsened by climate change, continue to affect much of the Western United States and even the northern part of the Great Plains. \n", "\n", - " label discourse_type_num \\\n", - "0 Lead Lead 1 \n", - "1 Position Position 1 \n", - "2 Evidence Evidence 1 \n", - "3 Evidence Evidence 2 \n", - "4 Claim Claim 1 \n", - "... ... ... \n", - "144288 Evidence Evidence 2 \n", - "144289 Evidence Evidence 3 \n", - "144290 Position Position 1 \n", - "144291 Evidence Evidence 4 \n", - "144292 Concluding Statement Concluding Statement 1 \n", + " label score start end source \n", + "0 Evidence 0.983720 0 528 abortion-florida-15-week-ban \n", + "1 Evidence 0.934319 528 908 abortion-florida-15-week-ban \n", + "2 Evidence 0.622358 908 1214 abortion-florida-15-week-ban \n", + "3 Evidence 0.946866 1214 1722 abortion-florida-15-week-ban \n", + "4 Evidence 0.991869 1722 2394 abortion-florida-15-week-ban \n", + "... ... ... ... ... ... \n", + "3893 Claim 0.982928 2554 2573 yosemite-falls \n", + "3894 Rebuttal 0.880377 2573 2636 yosemite-falls \n", + "3895 Claim 0.541481 2636 2769 yosemite-falls \n", + "3896 Evidence 0.479049 2769 2925 yosemite-falls \n", + "3897 Claim 0.478424 2925 3080 yosemite-falls \n", "\n", - " predictionstring \\\n", - "0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 \n", - "1 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 \n", - "2 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 \n", - "3 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 \n", - "4 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 \n", - "... ... \n", - "144288 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 ... \n", - "144289 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 ... \n", - "144290 828 829 830 831 832 833 834 835 836 837 838 \n", - "144291 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 \n", - "144292 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1... \n", - "\n", - " is_valid \n", - "0 False \n", - "1 False \n", - "2 False \n", - "3 False \n", - "4 False \n", - "... ... \n", - "144288 True \n", - "144289 True \n", - "144290 True \n", - "144291 True \n", - "144292 True \n", - "\n", - "[144293 rows x 9 columns]" + "[3898 rows x 6 columns]" ] }, - "execution_count": 22, + "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "df = pd.read_csv(\"feedback-prize-2021/train.csv\").rename(columns={\"discourse_text\":\"text\", \"discourse_type\":\"label\"})\n", - "l = df.shape[0]\n", - "df[\"is_valid\"] = [False for i in range(int(l * 0.7))] + [True for i in range(l-int(l * 0.7))]\n", + "df = pd.read_csv(\"datagen/nytimes/pseudo.csv\")\n", "df" ] }, { "cell_type": "code", - "execution_count": 24, - "id": "64600ce4", - "metadata": { - "ExecuteTime": { - "end_time": "2022-02-20T15:40:45.428309Z", - "start_time": "2022-02-20T15:35:23.806772Z" - } - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Due to IPython and Windows limitation, python multiprocessing isn't available now.\n", - "So `n_workers` has to be changed to 0 to avoid getting stuck\n", - "Due to IPython and Windows limitation, python multiprocessing isn't available now.\n", - "So `number_workers` is changed to 0 to avoid getting stuck\n" - ] - }, - { - "data": { - "text/html": [ - "\n", - " | text | \n", - "category | \n", - "
---|---|---|
0 | \n", - "xxbos xxmaj in the year 1976 , when xxmaj viking 1 space craft was taking photographs of possiable landing spots for xxmaj viking 2 spacecraft , they found a formation in a rock that looked like a human face . xxmaj the shadows made the rock look like it had a nose , mouth , and two eyes , like a human . xxmaj this was found in a region of the xxmaj red xxmaj planet called xxmaj cydonia . xxmaj the \" head \" was nearly two miles from end to end , and it seemed to be starring back at the cameras . \\n\\n xxmaj the controllers back at the xxmaj jet xxmaj propulsion xxmaj lab were probably quite surprised when this face popped up on their screens , looking them right in the eyes . xxmaj this sensation was short lived . xxmaj scientist figured it was | \n", - "Evidence | \n", - "
1 | \n", - "xxbos xxmaj for me a car is very important , because if you have a car you can move to other places that you want . xxmaj but not only that , if you have an emergency you can go rapidly , or in time . xxmaj but this is not a facility in all countries and exist much problems with that , for example in xxmaj germany the street parking , driveways and home garages , this are generally forbidden , new district on the outskirts of xxmaj freiburg , near the xxmaj french and xxmaj swiss . but in xxmaj vauban 's streets are completly car free , this is so good , but with a limit , like ▁ except the main thoroughfare , where the tram to downtown xxmaj freiburg runs . \\n\\n xxmaj in xxunk a result , 70 percent of xxmaj vauban 's families | \n", - "Evidence | \n", - "
epoch | \n", - "train_loss | \n", - "valid_loss | \n", - "accuracy | \n", - "perplexity | \n", - "time | \n", - "
---|
\n", - "\n", - "
\n", + " | text | \n", + "label | \n", + "score | \n", + "start | \n", + "end | \n", + "source | \n", + "
---|---|---|---|---|---|---|
0 | \n", + "The metaverse is coming. It was once a science... | \n", + "Lead | \n", + "0.913818 | \n", + "0 | \n", + "348 | \n", + "metaverse-politics-disinformation-society | \n", + "
1 | \n", + "In the metaverse, a user might curate a digita... | \n", + "Evidence | \n", + "0.457832 | \n", + "348 | \n", + "642 | \n", + "metaverse-politics-disinformation-society | \n", + "
2 | \n", + "But while the metaverse could revolutionize wo... | \n", + "Rebuttal | \n", + "0.857951 | \n", + "642 | \n", + "790 | \n", + "metaverse-politics-disinformation-society | \n", + "
3 | \n", + "Virtual environments will supercharge disinfor... | \n", + "Evidence | \n", + "0.730927 | \n", + "790 | \n", + "1177 | \n", + "metaverse-politics-disinformation-society | \n", + "
4 | \n", + "A failure to anticipate these possibilities ma... | \n", + "Claim | \n", + "0.484750 | \n", + "1177 | \n", + "1323 | \n", + "metaverse-politics-disinformation-society | \n", + "
5 | \n", + "Today, glimpses of the metaverse are everywher... | \n", + "Lead | \n", + "0.699519 | \n", + "1323 | \n", + "1708 | \n", + "metaverse-politics-disinformation-society | \n", + "
6 | \n", + "There’s already evidence that online multiplay... | \n", + "Evidence | \n", + "0.613328 | \n", + "1708 | \n", + "1954 | \n", + "metaverse-politics-disinformation-society | \n", + "
7 | \n", + "The metaverse could allow motivated regimes or... | \n", + "Evidence | \n", + "0.683931 | \n", + "1954 | \n", + "2188 | \n", + "metaverse-politics-disinformation-society | \n", + "
8 | \n", + "In environments where individuals can be repre... | \n", + "Claim | \n", + "0.549679 | \n", + "2188 | \n", + "2399 | \n", + "metaverse-politics-disinformation-society | \n", + "
9 | \n", + "Digital espionage has already been used by doz... | \n", + "Evidence | \n", + "0.686262 | \n", + "2399 | \n", + "2752 | \n", + "metaverse-politics-disinformation-society | \n", + "
10 | \n", + "Countries and corporations alike will likely a... | \n", + "Claim | \n", + "0.816655 | \n", + "2752 | \n", + "2885 | \n", + "metaverse-politics-disinformation-society | \n", + "
11 | \n", + "States have already used facial recognition te... | \n", + "Evidence | \n", + "0.959065 | \n", + "2885 | \n", + "3243 | \n", + "metaverse-politics-disinformation-society | \n", + "
12 | \n", + "Even the metaverse’s physical infrastructure w... | \n", + "Claim | \n", + "0.963662 | \n", + "3243 | \n", + "3328 | \n", + "metaverse-politics-disinformation-society | \n", + "
13 | \n", + "A constellation of technologies, including har... | \n", + "Evidence | \n", + "0.870708 | \n", + "3328 | \n", + "3653 | \n", + "metaverse-politics-disinformation-society | \n", + "
14 | \n", + "China could effectively control the metaverse’... | \n", + "Evidence | \n", + "0.893361 | \n", + "3653 | \n", + "3988 | \n", + "metaverse-politics-disinformation-society | \n", + "
15 | \n", + "This kind of physical infrastructure will, in ... | \n", + "Evidence | \n", + "0.863372 | \n", + "3988 | \n", + "4281 | \n", + "metaverse-politics-disinformation-society | \n", + "
16 | \n", + "Despite these threats, the metaverse also has ... | \n", + "Rebuttal | \n", + "0.626262 | \n", + "4281 | \n", + "4631 | \n", + "metaverse-politics-disinformation-society | \n", + "
17 | \n", + "Virtual environments have also shown promise f... | \n", + "Evidence | \n", + "0.980946 | \n", + "4631 | \n", + "5027 | \n", + "metaverse-politics-disinformation-society | \n", + "
18 | \n", + "But the metaverse’s consequences may be even m... | \n", + "Rebuttal | \n", + "0.859729 | \n", + "5027 | \n", + "5085 | \n", + "metaverse-politics-disinformation-society | \n", + "
19 | \n", + "If it becomes as all-encompassing as some pred... | \n", + "Evidence | \n", + "0.821782 | \n", + "5085 | \n", + "5496 | \n", + "metaverse-politics-disinformation-society | \n", + "
20 | \n", + "The metaverse may have been born in science fi... | \n", + "Position | \n", + "0.460967 | \n", + "5496 | \n", + "5615 | \n", + "metaverse-politics-disinformation-society | \n", + "
21 | \n", + "The metaverse is coming. It was once a science... | \n", + "Lead | \n", + "0.913818 | \n", + "0 | \n", + "348 | \n", + "metaverse-politics-disinformation-society | \n", + "
22 | \n", + "In the metaverse, a user might curate a digita... | \n", + "Evidence | \n", + "0.457832 | \n", + "348 | \n", + "642 | \n", + "metaverse-politics-disinformation-society | \n", + "
23 | \n", + "But while the metaverse could revolutionize wo... | \n", + "Rebuttal | \n", + "0.857951 | \n", + "642 | \n", + "790 | \n", + "metaverse-politics-disinformation-society | \n", + "
24 | \n", + "Virtual environments will supercharge disinfor... | \n", + "Evidence | \n", + "0.730927 | \n", + "790 | \n", + "1177 | \n", + "metaverse-politics-disinformation-society | \n", + "
25 | \n", + "A failure to anticipate these possibilities ma... | \n", + "Claim | \n", + "0.484750 | \n", + "1177 | \n", + "1323 | \n", + "metaverse-politics-disinformation-society | \n", + "
26 | \n", + "Today, glimpses of the metaverse are everywher... | \n", + "Lead | \n", + "0.699519 | \n", + "1323 | \n", + "1708 | \n", + "metaverse-politics-disinformation-society | \n", + "
27 | \n", + "There’s already evidence that online multiplay... | \n", + "Evidence | \n", + "0.613328 | \n", + "1708 | \n", + "1954 | \n", + "metaverse-politics-disinformation-society | \n", + "
28 | \n", + "The metaverse could allow motivated regimes or... | \n", + "Evidence | \n", + "0.683931 | \n", + "1954 | \n", + "2188 | \n", + "metaverse-politics-disinformation-society | \n", + "
29 | \n", + "In environments where individuals can be repre... | \n", + "Claim | \n", + "0.549679 | \n", + "2188 | \n", + "2399 | \n", + "metaverse-politics-disinformation-society | \n", + "
30 | \n", + "Digital espionage has already been used by doz... | \n", + "Evidence | \n", + "0.686262 | \n", + "2399 | \n", + "2752 | \n", + "metaverse-politics-disinformation-society | \n", + "
31 | \n", + "Countries and corporations alike will likely a... | \n", + "Claim | \n", + "0.816655 | \n", + "2752 | \n", + "2885 | \n", + "metaverse-politics-disinformation-society | \n", + "
32 | \n", + "States have already used facial recognition te... | \n", + "Evidence | \n", + "0.959065 | \n", + "2885 | \n", + "3243 | \n", + "metaverse-politics-disinformation-society | \n", + "
33 | \n", + "Even the metaverse’s physical infrastructure w... | \n", + "Claim | \n", + "0.963662 | \n", + "3243 | \n", + "3328 | \n", + "metaverse-politics-disinformation-society | \n", + "
34 | \n", + "A constellation of technologies, including har... | \n", + "Evidence | \n", + "0.870708 | \n", + "3328 | \n", + "3653 | \n", + "metaverse-politics-disinformation-society | \n", + "
35 | \n", + "China could effectively control the metaverse’... | \n", + "Evidence | \n", + "0.893361 | \n", + "3653 | \n", + "3988 | \n", + "metaverse-politics-disinformation-society | \n", + "
36 | \n", + "This kind of physical infrastructure will, in ... | \n", + "Evidence | \n", + "0.863372 | \n", + "3988 | \n", + "4281 | \n", + "metaverse-politics-disinformation-society | \n", + "
37 | \n", + "Despite these threats, the metaverse also has ... | \n", + "Rebuttal | \n", + "0.626262 | \n", + "4281 | \n", + "4631 | \n", + "metaverse-politics-disinformation-society | \n", + "
38 | \n", + "Virtual environments have also shown promise f... | \n", + "Evidence | \n", + "0.980946 | \n", + "4631 | \n", + "5027 | \n", + "metaverse-politics-disinformation-society | \n", + "
39 | \n", + "But the metaverse’s consequences may be even m... | \n", + "Rebuttal | \n", + "0.859729 | \n", + "5027 | \n", + "5085 | \n", + "metaverse-politics-disinformation-society | \n", + "
40 | \n", + "If it becomes as all-encompassing as some pred... | \n", + "Evidence | \n", + "0.821782 | \n", + "5085 | \n", + "5496 | \n", + "metaverse-politics-disinformation-society | \n", + "
41 | \n", + "The metaverse may have been born in science fi... | \n", + "Position | \n", + "0.460967 | \n", + "5496 | \n", + "5615 | \n", + "metaverse-politics-disinformation-society | \n", + "
\n", + " | text | \n", + "label | \n", + "score | \n", + "start | \n", + "end | \n", + "source | \n", + "
---|---|---|---|---|---|---|
0 | \n", + "In 2019 a wave of anti-abortion laws swept thi... | \n", + "Evidence | \n", + "0.983720 | \n", + "0 | \n", + "528 | \n", + "abortion-florida-15-week-ban | \n", + "
1 | \n", + "Though most of these laws were quickly blocked... | \n", + "Evidence | \n", + "0.934319 | \n", + "528 | \n", + "908 | \n", + "abortion-florida-15-week-ban | \n", + "
2 | \n", + "Three years later, American reproductive right... | \n", + "Evidence | \n", + "0.622358 | \n", + "908 | \n", + "1214 | \n", + "abortion-florida-15-week-ban | \n", + "
3 | \n", + "It might seem curious, then, that legislators ... | \n", + "Evidence | \n", + "0.946866 | \n", + "1214 | \n", + "1722 | \n", + "abortion-florida-15-week-ban | \n", + "
4 | \n", + "One of this year’s unmistakable trends in anti... | \n", + "Evidence | \n", + "0.991869 | \n", + "1722 | \n", + "2394 | \n", + "abortion-florida-15-week-ban | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
3893 | \n", + "And boy did it come | \n", + "Claim | \n", + "0.982928 | \n", + "2554 | \n", + "2573 | \n", + "yosemite-falls | \n", + "
3894 | \n", + "But the record rains will not end California’s... | \n", + "Rebuttal | \n", + "0.880377 | \n", + "2573 | \n", + "2636 | \n", + "yosemite-falls | \n", + "
3895 | \n", + "Last week, Gov. Gavin Newsom extended the stat... | \n", + "Claim | \n", + "0.541481 | \n", + "2636 | \n", + "2769 | \n", + "yosemite-falls | \n", + "
3896 | \n", + "This has been California’s second driest year ... | \n", + "Evidence | \n", + "0.479049 | \n", + "2769 | \n", + "2925 | \n", + "yosemite-falls | \n", + "
3897 | \n", + "Severe drought conditions, worsened by climate... | \n", + "Claim | \n", + "0.478424 | \n", + "2925 | \n", + "3080 | \n", + "yosemite-falls | \n", + "
3898 rows × 6 columns
\n", + "\n", + " | text | \n", + "label | \n", + "score | \n", + "start | \n", + "end | \n", + "source | \n", + "
---|---|---|---|---|---|---|
0 | \n", + "In 2019 a wave of anti-abortion laws swept thi... | \n", + "Evidence | \n", + "0.983720 | \n", + "0 | \n", + "528 | \n", + "abortion-florida-15-week-ban | \n", + "
1 | \n", + "Though most of these laws were quickly blocked... | \n", + "Evidence | \n", + "0.934319 | \n", + "528 | \n", + "908 | \n", + "abortion-florida-15-week-ban | \n", + "
2 | \n", + "Three years later, American reproductive right... | \n", + "Evidence | \n", + "0.622358 | \n", + "908 | \n", + "1214 | \n", + "abortion-florida-15-week-ban | \n", + "
3 | \n", + "It might seem curious, then, that legislators ... | \n", + "Evidence | \n", + "0.946866 | \n", + "1214 | \n", + "1722 | \n", + "abortion-florida-15-week-ban | \n", + "
4 | \n", + "One of this year’s unmistakable trends in anti... | \n", + "Evidence | \n", + "0.991869 | \n", + "1722 | \n", + "2394 | \n", + "abortion-florida-15-week-ban | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
3893 | \n", + "And boy did it come | \n", + "Claim | \n", + "0.982928 | \n", + "2554 | \n", + "2573 | \n", + "yosemite-falls | \n", + "
3894 | \n", + "But the record rains will not end California’s... | \n", + "Rebuttal | \n", + "0.880377 | \n", + "2573 | \n", + "2636 | \n", + "yosemite-falls | \n", + "
3895 | \n", + "Last week, Gov. Gavin Newsom extended the stat... | \n", + "Claim | \n", + "0.541481 | \n", + "2636 | \n", + "2769 | \n", + "yosemite-falls | \n", + "
3896 | \n", + "This has been California’s second driest year ... | \n", + "Evidence | \n", + "0.479049 | \n", + "2769 | \n", + "2925 | \n", + "yosemite-falls | \n", + "
3897 | \n", + "Severe drought conditions, worsened by climate... | \n", + "Claim | \n", + "0.478424 | \n", + "2925 | \n", + "3080 | \n", + "yosemite-falls | \n", + "
3898 rows × 6 columns
\n", + "\n", + " | textualScore | \n", + "
---|---|
0 | \n", + "0.813205 | \n", + "
1 | \n", + "0.685687 | \n", + "
2 | \n", + "0.809620 | \n", + "
3 | \n", + "0.800835 | \n", + "
4 | \n", + "0.731424 | \n", + "
... | \n", + "... | \n", + "
154 | \n", + "0.772159 | \n", + "
155 | \n", + "0.844647 | \n", + "
156 | \n", + "0.714356 | \n", + "
157 | \n", + "0.670670 | \n", + "
158 | \n", + "0.797801 | \n", + "
159 rows × 1 columns
\n", + "