<86>Dec 4 18:51:44 userdel[2617143]: delete user 'rooter' <86>Dec 4 18:51:44 groupadd[2617158]: group added to /etc/group: name=rooter, GID=648 <86>Dec 4 18:51:44 groupadd[2617158]: group added to /etc/gshadow: name=rooter <86>Dec 4 18:51:44 groupadd[2617158]: new group: name=rooter, GID=648 <86>Dec 4 18:51:44 useradd[2617171]: new user: name=rooter, UID=648, GID=648, home=/root, shell=/bin/bash <86>Dec 4 18:51:44 userdel[2617226]: delete user 'builder' <86>Dec 4 18:51:44 userdel[2617226]: removed group 'builder' owned by 'builder' <86>Dec 4 18:51:44 userdel[2617226]: removed shadow group 'builder' owned by 'builder' <86>Dec 4 18:51:44 groupadd[2617287]: group added to /etc/group: name=builder, GID=649 <86>Dec 4 18:51:44 groupadd[2617287]: group added to /etc/gshadow: name=builder <86>Dec 4 18:51:44 groupadd[2617287]: new group: name=builder, GID=649 <86>Dec 4 18:51:44 useradd[2617296]: new user: name=builder, UID=649, GID=649, home=/usr/src, shell=/bin/bash /usr/src/in/srpm/boilerpipe-1.2.0-alt1_13jpp8.src.rpm: license not found in '/usr/share/license' directory: ASL /usr/src/in/srpm/boilerpipe-1.2.0-alt1_13jpp8.src.rpm: license not found in '/usr/share/license' directory: 2.0 <13>Dec 4 18:51:48 rpmi: rpm-macros-java-1:5.3.0-alt1_4jpp8 sisyphus+234467.100.1.1 1563037789 installed <13>Dec 4 18:51:52 rpmi: javapackages-filesystem-1:5.3.0-alt1_4jpp8 sisyphus+234467.100.1.1 1563037789 installed <13>Dec 4 18:51:52 rpmi: javapackages-tools-1:5.3.0-alt1_4jpp8 sisyphus+234467.100.1.1 1563037789 installed <13>Dec 4 18:51:52 rpmi: libpng16-1.6.37-alt1 sisyphus+236677.100.2.1 1566917998 installed <13>Dec 4 18:51:52 rpmi: libexpat-2.2.10-alt1 sisyphus+259966.100.1.1 1602824518 installed <13>Dec 4 18:51:52 rpmi: xorg-proto-devel-2020.1-alt1 sisyphus+250406.100.1.1 1587554810 installed <13>Dec 4 18:51:52 rpmi: perl-HTTP-Date-6.05-alt1 sisyphus+258981.100.1.1 1601542386 installed <13>Dec 4 18:51:52 rpmi: libwayland-client-1.18.0-alt1 sisyphus+255795.100.1.1 1596475648 installed <13>Dec 4 18:51:52 rpmi: libjpeg-2:2.0.2-alt1 sisyphus+226996.100.1.1 1554902907 installed <13>Dec 4 18:51:52 rpmi: libICE-1.0.10-alt1 sisyphus+247690.100.1.1 1584000387 installed <13>Dec 4 18:51:52 rpmi: libSM-1.2.3-alt1 sisyphus+226734.100.2.1 1554586158 installed <13>Dec 4 18:51:52 rpmi: beust-jcommander-1.71-alt1_6jpp8 sisyphus+230680.100.1.3 1559093321 installed <13>Dec 4 18:51:52 rpmi: xmvn-api-3.0.0-alt1_23jpp8 sisyphus+234592.200.1.1 1563216657 installed <13>Dec 4 18:51:52 rpmi: xmvn-core-3.0.0-alt1_23jpp8 sisyphus+234592.200.1.1 1563216657 installed <13>Dec 4 18:51:52 rpmi: xml-commons-apis-1.4.01-alt3_29jpp8 sisyphus+246084.100.1.1 1581616535 installed <13>Dec 4 18:51:52 rpmi: liblksctp-1.0.17-alt2 1523113261 installed <13>Dec 4 18:51:52 rpmi: libsqlite3-3.33.0-alt1 sisyphus+256344.100.1.1 1597522272 installed <13>Dec 4 18:51:52 rpmi: liblcms2-2.11-alt1 sisyphus+253499.100.1.1 1592287020 installed <13>Dec 4 18:51:52 rpmi: perl-XML-NamespaceSupport-1.12-alt1 1491296348 installed <13>Dec 4 18:51:52 rpmi: lksctp-tools-1.0.17-alt2 1523113261 installed <13>Dec 4 18:51:52 rpmi: java-common-1.6.0-alt1 sisyphus+234020.100.1.1 1562437039 installed <13>Dec 4 18:51:52 rpmi: xml-utils-1:2.9.10-alt4 sisyphus+261132.100.1.1 1604669137 installed <13>Dec 4 18:51:52 rpmi: libpcsclite-1.9.0-alt1 sisyphus+253463.100.1.1 1592202070 installed <13>Dec 4 18:51:52 rpmi: javazi-2020d-alt1 sisyphus+260194.200.1.1 1603317357 installed <13>Dec 4 18:51:52 rpmi: libgif-4.1.6-alt3 1299634261 installed <13>Dec 4 18:51:52 rpmi: perl-LWP-MediaTypes-6.04-alt1 sisyphus+225468.100.1.1 1553186684 installed <13>Dec 4 18:51:52 rpmi: perl-Compress-Raw-Zlib-2.096-alt1 sisyphus+258375.500.14.2 1600904345 installed <13>Dec 4 18:51:52 rpmi: perl-libnet-1:3.11-alt1 1511423541 installed <13>Dec 4 18:51:52 rpmi: perl-XML-SAX-Base-1.09-alt1 1494364363 installed <13>Dec 4 18:51:52 rpmi: libfribidi-1.0.10-alt1 sisyphus+254557.100.1.1 1594020362 installed <13>Dec 4 18:51:52 rpmi: libepoxy-1.5.4-alt1 sisyphus+242061.100.1.1 1575190160 installed <13>Dec 4 18:51:52 rpmi: libglvnd-7:1.3.2-alt1 sisyphus+254610.100.1.1 1594124268 installed <13>Dec 4 18:51:52 rpmi: libwayland-server-1.18.0-alt1 sisyphus+255795.100.1.1 1596475648 installed <13>Dec 4 18:51:52 rpmi: libidn2-2.3.0-alt1 sisyphus+240846.100.1.2 1573870475 installed <13>Dec 4 18:51:52 rpmi: libnettle8-3.6-alt1 sisyphus+251637.100.3.1 1590060253 installed <13>Dec 4 18:51:52 rpmi: libp11-kit-0.23.15-alt2 sisyphus+252784.100.2.2 1591274901 installed <13>Dec 4 18:51:52 rpmi: libtasn1-4.16.0-alt1 sisyphus+245480.100.1.1 1580825062 installed <13>Dec 4 18:51:52 rpmi: libhogweed6-3.6-alt1 sisyphus+251637.100.3.1 1590060253 installed <13>Dec 4 18:51:52 rpmi: libgnutls30-3.6.15-alt1 sisyphus+257742.200.2.1 1599668978 installed <13>Dec 4 18:51:52 rpmi: libICE-devel-1.0.10-alt1 sisyphus+247690.100.1.1 1584000387 installed <13>Dec 4 18:51:52 rpmi: libSM-devel-1.2.3-alt1 sisyphus+226734.100.2.1 1554586158 installed <13>Dec 4 18:51:52 rpmi: libwayland-cursor-1.18.0-alt1 sisyphus+255795.100.1.1 1596475648 installed <13>Dec 4 18:51:52 rpmi: libwayland-egl-4:18.1.0-alt1 sisyphus+255795.100.1.1 1596475648 installed <13>Dec 4 18:51:52 rpmi: perl-File-Listing-6.14-alt1 sisyphus+262735.100.1.1 1606813544 installed <13>Dec 4 18:51:52 rpmi: ant-lib-0:1.10.5-alt1_5jpp8 sisyphus+232747.100.2.1 1561092977 installed <13>Dec 4 18:51:52 rpmi: apache-commons-compress-0:1.18-alt1_6jpp8 sisyphus+259620.100.1.2 1602397352 installed <13>Dec 4 18:51:52 rpmi: bcel-1:6.3.1-alt1_2jpp8 sisyphus+259662.100.1.3 1602421437 installed <13>Dec 4 18:51:52 rpmi: slf4j-0:1.7.25-alt1_6jpp8 sisyphus+234787.100.1.2 1563401783 installed <13>Dec 4 18:51:53 rpmi: zip-30000000:3.0-alt1 1332241772 installed <13>Dec 4 18:51:53 rpmi: sgml-common-0.6.3-alt15 1423664786 installed <13>Dec 4 18:51:53 rpmi: docbook-dtds-4.5-alt1 1223476557 installed <13>Dec 4 18:51:53 rpmi: docbook-style-xsl-1.79.1-alt4 sisyphus+232871.100.1.1 1561238010 installed <13>Dec 4 18:51:53 rpmi: libnatspec-0.3.1-alt2 1445691580 installed <13>Dec 4 18:51:53 rpmi: unzip-6.0-alt4 sisyphus+261685.200.2.1 1605218923 installed <13>Dec 4 18:51:53 rpmi: libgdbm-1.8.3-alt10 1454943334 installed <13>Dec 4 18:51:53 rpmi: libnspr-1:4.29-alt1 sisyphus+260224.100.2.1 1603548999 installed <13>Dec 4 18:51:53 rpmi: libgtk+2-locales-2.24.32-alt5 sisyphus+262336.100.3.1 1606161374 installed <13>Dec 4 18:51:53 rpmi: icon-theme-hicolor-0.17-alt2 sisyphus+248343.100.1.1 1584979043 installed <13>Dec 4 18:51:53 rpmi: libxkbcommon-1.0.3-alt1 sisyphus+262369.100.1.1 1606206980 installed <13>Dec 4 18:51:53 rpmi: publicsuffix-list-dafsa-20201117-alt1 sisyphus+262026.100.1.1 1605704486 installed <13>Dec 4 18:51:53 rpmi: libpsl-0.21.1-alt1 sisyphus+255206.100.1.1 1595348938 installed <13>Dec 4 18:51:53 rpmi: libverto-0.3.0-alt1_7 sisyphus+225932.100.1.1 1553994919 installed <13>Dec 4 18:51:53 rpmi: liblmdb-0.9.23-alt1 sisyphus+225277.100.2.1 1553001679 installed <13>Dec 4 18:51:53 rpmi: libkeyutils-1.6.1-alt1 sisyphus+256015.100.1.1 1596820124 installed <13>Dec 4 18:51:53 rpmi: libcom_err-1.45.6.0.24.af1a-alt1 sisyphus+262279.100.1.1 1606088229 installed <13>Dec 4 18:51:53 rpmi: libusb-1.0.23-alt1 sisyphus+237317.100.1.1 1568059905 installed <13>Dec 4 18:51:53 rpmi: libgudev-1:234-alt1 sisyphus+258314.700.14.2 1600844807 installed <13>Dec 4 18:51:53 rpmi: udev-rules-1:247-alt1 sisyphus+262610.100.3.1 1606868507 installed <13>Dec 4 18:51:53 rpmi: perl-Try-Tiny-0.30-alt1 1514318058 installed <13>Dec 4 18:51:53 rpmi: perl-IO-Socket-IP-0.41-alt1 sisyphus+259012.100.1.2 1601553446 installed <13>Dec 4 18:51:53 rpmi: perl-Compress-Raw-Bzip2-2.096-alt1 sisyphus+258375.600.14.2 1600904372 installed <13>Dec 4 18:51:53 rpmi: perl-HTML-Tagset-3.20-alt2 1317725093 installed <13>Dec 4 18:51:53 rpmi: perl-Term-ANSIColor-5.01-alt1 sisyphus+244783.100.1.2 1579747505 installed <13>Dec 4 18:51:53 rpmi: perl-Data-Dump-1.23-alt1 1444601978 installed <13>Dec 4 18:51:53 rpmi: perl-Filter-1.60-alt1 sisyphus+258375.300.14.2 1600904226 installed <13>Dec 4 18:51:53 rpmi: perl-Encode-3.07-alt1 sisyphus+258375.400.14.2 1600904306 installed <13>Dec 4 18:51:53 rpmi: perl-URI-5.05-alt1 sisyphus+260330.100.1.1 1603548554 installed <13>Dec 4 18:51:53 rpmi: perl-IO-Compress-2.096-alt1 sisyphus+257145.100.2.1 1599037634 installed <13>Dec 4 18:51:53 rpmi: perl-Net-HTTP-6.19-alt1 sisyphus+229756.100.1.1 1558454558 installed <13>Dec 4 18:51:53 rpmi: perl-HTML-Parser-3.75-alt1 sisyphus+258375.1000.14.2 1600904431 installed <13>Dec 4 18:51:53 rpmi: perl-WWW-RobotRules-6.02-alt1 1329756211 installed <13>Dec 4 18:51:53 rpmi: perl-Encode-Locale-1.05-alt1 1444608613 installed <13>Dec 4 18:51:53 rpmi: perl-IO-HTML-1.004-alt1 sisyphus+258983.100.1.1 1601542619 installed <13>Dec 4 18:51:53 rpmi: perl-HTTP-Message-6.26-alt2 sisyphus+261580.100.1.1 1605116674 installed <13>Dec 4 18:51:53 rpmi: perl-HTTP-Cookies-6.09-alt1 sisyphus+262287.100.1.1 1606090361 installed <13>Dec 4 18:51:53 rpmi: perl-HTTP-Negotiate-6.01-alt1 1329760563 installed <13>Dec 4 18:51:53 rpmi: perl-libwww-6.49-alt1 sisyphus+258986.100.1.2 1601547042 installed <13>Dec 4 18:51:53 rpmi: perl-XML-LibXML-2.0205-alt2 sisyphus+258727.100.1.2 1601156312 installed <13>Dec 4 18:51:53 rpmi: perl-XML-SAX-1.02-alt1 sisyphus+232322.100.1.1 1560758406 installed <13>Dec 4 18:51:53 rpmi: perl-XML-Simple-2.25-alt2 sisyphus+257498.100.1.1 1599324034 installed <13>Dec 4 18:51:53 rpmi: icon-naming-utils-0.8.90-alt1 1236573102 installed <13>Dec 4 18:51:54 rpmi: icon-theme-adwaita-3.38.0-alt1 sisyphus+258314.1700.14.2 1600844421 installed <13>Dec 4 18:51:54 rpmi: libdatrie-0.2.9-alt1_6 1511686676 installed <13>Dec 4 18:51:54 rpmi: libthai-0.1.28-alt1_1 sisyphus+226107.100.1.1 1554123079 installed <13>Dec 4 18:51:54 rpmi: libpixman-3:0.40.0-alt1 sisyphus+250700.100.1.1 1587971055 installed <13>Dec 4 18:51:54 rpmi: libbrotlicommon-1.0.9-alt2 sisyphus+257777.100.1.1 1599688017 installed <13>Dec 4 18:51:54 rpmi: libbrotlidec-1.0.9-alt2 sisyphus+257777.100.1.1 1599688017 installed <13>Dec 4 18:51:54 rpmi: libgraphite2-1.3.14-alt2 sisyphus+250009.100.1.1 1586943065 installed <13>Dec 4 18:51:54 rpmi: libharfbuzz-2.6.8-alt1 sisyphus+254028.100.1.1 1593106819 installed <13>Dec 4 18:51:54 rpmi: libfreetype-2.10.4-alt2 sisyphus+260293.100.2.1 1604479496 installed <13>Dec 4 18:51:54 rpmi: fontconfig-2.13.1-alt1 sisyphus+257555.100.1.1 1599475160 installed Updating fonts cache: <29>Dec 4 18:51:55 fontconfig: Updating fonts cache: succeeded [ DONE ] <13>Dec 4 18:51:55 rpmi: fonts-type1-xorg-7.0.0-alt4 1188553211 installed <13>Dec 4 18:51:56 rpmi: libxshmfence-1.3-alt1 sisyphus+223149.1000.2.1 1551268571 installed <13>Dec 4 18:51:56 rpmi: libpciaccess-1:0.16-alt1 sisyphus+234814.100.1.1 1563438291 installed <13>Dec 4 18:51:56 rpmi: libdrm-1:2.4.103-alt1 sisyphus+261080.100.1.1 1604598368 installed <13>Dec 4 18:51:56 rpmi: libgbm-4:20.2.3-alt1 sisyphus+262368.100.1.1 1606200337 installed <13>Dec 4 18:51:56 rpmi: libwebp7-1.1.0-alt1 sisyphus+243895.100.1.1 1578410873 installed <13>Dec 4 18:51:56 rpmi: libjbig-2.1-alt1 1401380926 installed <13>Dec 4 18:51:56 rpmi: libtiff5-4.1.0-alt1 sisyphus+240802.100.1.1 1573743635 installed <13>Dec 4 18:51:56 rpmi: libgdk-pixbuf-locales-2.42.0-alt1 sisyphus+261999.200.2.1 1605722003 installed <13>Dec 4 18:51:56 rpmi: gtk+3-themes-incompatible-3.20-alt3 1461944560 installed <13>Dec 4 18:51:56 rpmi: libproxy-0.4.15-alt5 sisyphus+261556.100.1.1 1605106716 installed <13>Dec 4 18:51:56 rpmi: libatk-locales-2.36.0-alt1 sisyphus+249208.100.1.1 1585840405 installed <13>Dec 4 18:51:56 rpmi: libatk-2.36.0-alt1 sisyphus+249208.100.1.1 1585840406 installed <13>Dec 4 18:51:56 rpmi: shared-mime-info-2.0-alt1 sisyphus+251302.100.1.1 1588847607 installed <13>Dec 4 18:51:56 rpmi: gsettings-desktop-schemas-data-3.38.0-alt1 sisyphus+258314.500.14.2 1600843028 installed <13>Dec 4 18:51:56 rpmi: libgio-2.66.3-alt1 sisyphus+261863.100.1.1 1605540253 installed <13>Dec 4 18:51:56 rpmi: gsettings-desktop-schemas-3.38.0-alt1 sisyphus+258314.500.14.2 1600843530 installed <13>Dec 4 18:51:56 rpmi: libgdk-pixbuf-2.42.0-alt1 sisyphus+261999.200.2.1 1605722034 installed <13>Dec 4 18:51:56 rpmi: gtk-update-icon-cache-3.24.23-alt2 sisyphus+258314.2000.14.2 1600845597 installed <13>Dec 4 18:51:56 rpmi: libgusb-0.3.5-alt1 sisyphus+255577.100.1.1 1596150494 installed <13>Dec 4 18:51:56 rpmi: libcolord-1.4.5-alt1 sisyphus+260824.100.1.1 1604332825 installed <13>Dec 4 18:51:56 rpmi: libdconf-0.38.0-alt1 sisyphus+258314.1000.14.2 1600844866 installed <13>Dec 4 18:51:56 rpmi: libjson-glib-1.6.0-alt1 sisyphus+258314.2200.14.2 1600846193 installed <13>Dec 4 18:51:56 rpmi: liblz4-1:1.9.3-alt1 sisyphus+262305.100.1.1 1606099167 installed <13>Dec 4 18:51:56 rpmi: libgpg-error-1.36-alt1 sisyphus+225621.300.1.1 1553521082 installed <13>Dec 4 18:51:56 rpmi: libgcrypt20-1.8.5-alt3 sisyphus+239622.100.1.1 1571746654 installed <13>Dec 4 18:51:56 rpmi: libsystemd-1:247-alt1 sisyphus+262610.100.3.1 1606868459 installed <13>Dec 4 18:51:56 rpmi: libdbus-1.12.18-alt1 sisyphus+252758.100.1.1 1591203693 installed <13>Dec 4 18:51:56 rpmi: dbus-tools-1.12.18-alt1 sisyphus+252758.100.1.1 1591203693 installed <86>Dec 4 18:51:56 groupadd[2664150]: group added to /etc/group: name=messagebus, GID=499 <86>Dec 4 18:51:56 groupadd[2664150]: group added to /etc/gshadow: name=messagebus <86>Dec 4 18:51:56 groupadd[2664150]: new group: name=messagebus, GID=499 <86>Dec 4 18:51:56 useradd[2664175]: new user: name=messagebus, UID=499, GID=499, home=/run/dbus, shell=/dev/null <13>Dec 4 18:51:56 rpmi: dbus-1.12.18-alt1 sisyphus+252758.100.1.1 1591203693 installed <13>Dec 4 18:51:56 rpmi: dconf-0.38.0-alt1 sisyphus+258314.1000.14.2 1600844866 installed <13>Dec 4 18:51:56 rpmi: libgtk+3-schemas-3.24.23-alt2 sisyphus+258314.2000.14.2 1600844695 installed <13>Dec 4 18:51:56 rpmi: libavahi-0.8-alt1 sisyphus+255349.240.4.1 1595604514 installed <13>Dec 4 18:51:56 rpmi: libcups-2.3.1-alt2 sisyphus+255816.100.2.1 1596533556 installed <13>Dec 4 18:51:56 rpmi: libpolkit-0.118-alt1 sisyphus+257894.100.1.1 1599828367 installed <86>Dec 4 18:51:56 groupadd[2664851]: group added to /etc/group: name=colord, GID=498 <86>Dec 4 18:51:56 groupadd[2664851]: group added to /etc/gshadow: name=colord <86>Dec 4 18:51:56 groupadd[2664851]: new group: name=colord, GID=498 <86>Dec 4 18:51:56 useradd[2664866]: new user: name=colord, UID=498, GID=498, home=/var/colord, shell=/dev/null <13>Dec 4 18:51:56 rpmi: colord-1.4.5-alt1 sisyphus+260824.100.1.1 1604332825 installed <13>Dec 4 18:51:56 rpmi: libxslt-1.1.34-alt2 sisyphus+248264.100.1.1 1584829770 installed <13>Dec 4 18:51:56 rpmi: libX11-locales-3:1.6.12-alt1 sisyphus+256796.100.1.1 1598422159 installed <13>Dec 4 18:51:56 rpmi: libXdmcp-1.1.3-alt1 sisyphus+225206.600.1.2 1552949353 installed <13>Dec 4 18:51:56 rpmi: libXau-1.0.9-alt1 sisyphus+223149.200.2.1 1551268152 installed <13>Dec 4 18:51:56 rpmi: libxcb-1.14-alt1 sisyphus+247358.200.1.3 1583854228 installed <13>Dec 4 18:51:56 rpmi: libX11-3:1.6.12-alt1 sisyphus+256796.100.1.1 1598422166 installed <13>Dec 4 18:51:56 rpmi: libXext-1.3.4-alt1 sisyphus+225206.700.1.2 1552949429 installed <13>Dec 4 18:51:56 rpmi: libXrender-0.9.10-alt1 sisyphus+261890.100.1.1 1605595177 installed <13>Dec 4 18:51:56 rpmi: libXi-1.7.10-alt1 sisyphus+232786.300.1.1 1561106978 installed <13>Dec 4 18:51:56 rpmi: libXfixes-5.0.3-alt1 sisyphus+226736.100.2.2 1554614841 installed <13>Dec 4 18:51:56 rpmi: libXcomposite-0.4.5-alt1 sisyphus+225206.300.1.2 1552949137 installed <13>Dec 4 18:51:56 rpmi: libXtst-1.2.3-alt1 sisyphus+261890.200.1.1 1605595243 installed <13>Dec 4 18:51:56 rpmi: libXdamage-1.1.5-alt1 sisyphus+225206.500.1.2 1552949286 installed <13>Dec 4 18:51:56 rpmi: libXcursor-1.2.0-alt1 sisyphus+225206.400.1.2 1552949218 installed <13>Dec 4 18:51:56 rpmi: libXrandr-1.5.2-alt1 sisyphus+225206.1300.1.2 1552949710 installed <13>Dec 4 18:51:56 rpmi: libXinerama-1.1.4-alt1 sisyphus+223149.300.2.1 1551268216 installed <13>Dec 4 18:51:56 rpmi: libat-spi2-core-2.38.0-alt1 sisyphus+258314.1440.14.2 1600845165 installed <13>Dec 4 18:51:56 rpmi: libXft-2.3.3-alt1 sisyphus+225206.1000.3.2 1552987708 installed <13>Dec 4 18:51:56 rpmi: libXxf86vm-1.1.4-alt2 1527672187 installed <13>Dec 4 18:51:56 rpmi: libGLX-mesa-4:20.2.3-alt1 sisyphus+262368.100.1.1 1606200337 installed <13>Dec 4 18:51:56 rpmi: libEGL-mesa-4:20.2.3-alt1 sisyphus+262368.100.1.1 1606200337 installed <13>Dec 4 18:51:56 rpmi: libEGL-7:1.3.2-alt1 sisyphus+254610.100.1.1 1594124268 installed <13>Dec 4 18:51:56 rpmi: libGLX-7:1.3.2-alt1 sisyphus+254610.100.1.1 1594124268 installed <13>Dec 4 18:51:56 rpmi: libGL-7:1.3.2-alt1 sisyphus+254610.100.1.1 1594124268 installed <13>Dec 4 18:51:57 rpmi: libcairo-1:1.16.0-alt1 sisyphus+226534.100.2.3 1554515535 installed <13>Dec 4 18:51:57 rpmi: libpango-1.48.0-alt1 sisyphus+261300.100.2.1 1604868816 installed <13>Dec 4 18:51:57 rpmi: libgtk+2-2.24.32-alt5 sisyphus+262336.100.3.1 1606161327 installed <13>Dec 4 18:51:57 rpmi: libgail-2.24.32-alt5 sisyphus+262336.100.3.1 1606161327 installed <13>Dec 4 18:51:57 rpmi: libcairo-gobject-1:1.16.0-alt1 sisyphus+226534.100.2.3 1554515535 installed <13>Dec 4 18:51:57 rpmi: dbus-tools-gui-1.12.18-alt1 sisyphus+252758.100.1.1 1591203693 installed <13>Dec 4 18:51:57 rpmi: at-spi2-core-2.38.0-alt1 sisyphus+258314.1440.14.2 1600845165 installed <13>Dec 4 18:51:57 rpmi: at-spi2-atk-2.38.0-alt1 sisyphus+258314.1500.14.2 1600845211 installed <13>Dec 4 18:51:57 rpmi: libXt-1.2.0-alt1 sisyphus+247690.400.1.1 1584000596 installed <13>Dec 4 18:51:58 rpmi: libxcb-devel-1.14-alt1 sisyphus+247358.200.1.3 1583854228 installed <13>Dec 4 18:51:58 rpmi: libX11-devel-3:1.6.12-alt1 sisyphus+256796.100.1.1 1598422166 installed <13>Dec 4 18:51:58 rpmi: libXt-devel-1.2.0-alt1 sisyphus+247690.400.1.1 1584000596 installed <13>Dec 4 18:51:58 rpmi: rpm-macros-alternatives-0.5.1-alt1 sisyphus+226946.100.1.1 1554830426 installed <13>Dec 4 18:51:58 rpmi: alternatives-0.5.1-alt1 sisyphus+226946.100.1.1 1554830426 installed <13>Dec 4 18:51:58 rpmi: ca-certificates-2020.10.22-alt1 sisyphus+260224.300.2.1 1603549301 installed <13>Dec 4 18:51:58 rpmi: ca-trust-0.1.2-alt1 sisyphus+233348.100.1.1 1561653823 installed <13>Dec 4 18:51:58 rpmi: p11-kit-trust-0.23.15-alt2 sisyphus+252784.100.2.2 1591274901 installed <13>Dec 4 18:51:58 rpmi: libcrypto1.1-1.1.1g-alt1 sisyphus+249982.60.8.1 1587743711 installed <13>Dec 4 18:51:59 rpmi: libssl1.1-1.1.1g-alt1 sisyphus+249982.60.8.1 1587743711 installed <13>Dec 4 18:51:59 rpmi: libpython3-3.8.6-alt1 sisyphus+259085.100.2.1 1601904174 installed <13>Dec 4 18:51:59 rpmi: python3-3.8.6-alt1 sisyphus+259085.100.2.1 1601904174 installed <13>Dec 4 18:51:59 rpmi: python3-base-3.8.6-alt1 sisyphus+259085.100.2.1 1601904174 installed <13>Dec 4 18:51:59 rpmi: python3-module-six-1.15.0-alt1 sisyphus+255738.100.2.1 1596527214 installed <13>Dec 4 18:51:59 rpmi: python3-module-sugarbowl-0.52.1-alt1.git20141130.1.1 sisyphus+227470.1100.1.1 1555687657 installed <13>Dec 4 18:51:59 rpmi: ca-trust-java-0.1.2-alt1 sisyphus+233348.100.1.1 1561653823 installed <13>Dec 4 18:51:59 rpmi: python3-module-genshi-0.7.4-alt2 sisyphus+261703.100.2.1 1605232240 installed <13>Dec 4 18:51:59 rpmi: python3-module-markupsafe-1.1.1-alt1 sisyphus+248369.100.1.1 1585046136 installed <13>Dec 4 18:51:59 rpmi: python3-module-jinja2-2.11.2-alt1 sisyphus+254573.100.1.1 1594043344 installed <13>Dec 4 18:52:00 rpmi: python3-module-clyde-0.8.0-alt1.git20141130.2.1 sisyphus+227465.1600.1.2 1555756906 installed <13>Dec 4 18:52:00 rpmi: python3-module-runfile-0.46.1-alt1.git20141130.2.2 sisyphus+260033.420.3.1 1603324221 installed <13>Dec 4 18:52:00 rpmi: objectweb-asm-0:7.0-alt1_4jpp8 sisyphus+246362.100.1.3 1581801326 installed <13>Dec 4 18:52:00 rpmi: xmvn-install-3.0.0-alt1_23jpp8 sisyphus+234592.200.1.1 1563216657 installed <13>Dec 4 18:52:00 rpmi: xmvn-subst-3.0.0-alt1_23jpp8 sisyphus+234592.200.1.1 1563216657 installed <13>Dec 4 18:52:00 rpmi: xmvn-resolve-3.0.0-alt1_23jpp8 sisyphus+234592.200.1.1 1563216657 installed <13>Dec 4 18:52:00 rpmi: xml-commons-resolver-0:1.2-alt1_29jpp8 sisyphus+246085.100.1.1 1581616616 installed <13>Dec 4 18:52:00 rpmi: xalan-j2-0:2.7.1-alt4_39jpp8 sisyphus+230759.100.1.3 1559127607 installed <13>Dec 4 18:52:00 rpmi: xerces-j2-0:2.12.0-alt1_4jpp8 sisyphus+246082.100.1.1 1581615230 installed <13>Dec 4 18:52:00 rpmi: python3-module-webencodings-0.5.1-alt2 sisyphus+245915.200.1.1 1581496105 installed <13>Dec 4 18:52:00 rpmi: python3-module-cssselect-0.9.1-alt2 sisyphus+250566.2300.6.1 1588188959 installed <13>Dec 4 18:52:00 rpmi: python3-module-html5lib-1:1.0.1-alt1 sisyphus+238807.100.2.1 1570465973 installed <13>Dec 4 18:52:00 rpmi: python3-module-lxml-4.6.1-alt2 sisyphus+261624.100.1.1 1605171595 installed <13>Dec 4 18:52:00 rpmi: python3-module-javapackages-1:5.3.0-alt1_4jpp8 sisyphus+234467.100.1.1 1563037789 installed <13>Dec 4 18:52:00 rpmi: rpm-build-java-1:5.3.0-alt1_4jpp8 sisyphus+234467.100.1.1 1563037789 installed <86>Dec 4 18:52:00 groupadd[2684294]: group added to /etc/group: name=_keytab, GID=497 <86>Dec 4 18:52:00 groupadd[2684294]: group added to /etc/gshadow: name=_keytab <86>Dec 4 18:52:00 groupadd[2684294]: new group: name=_keytab, GID=497 <13>Dec 4 18:52:00 rpmi: libkrb5-1.18.3-alt1 sisyphus+262109.100.1.1 1605777180 installed <13>Dec 4 18:52:00 rpmi: glib-networking-2.66.0-alt1 sisyphus+258314.1200.14.2 1600845027 installed <13>Dec 4 18:52:00 rpmi: libsoup-2.72.0-alt1 sisyphus+258314.1100.14.2 1600844978 installed <13>Dec 4 18:52:00 rpmi: libsoup-gnome-2.72.0-alt1 sisyphus+258314.1100.14.2 1600844978 installed <13>Dec 4 18:52:00 rpmi: librest-0.8.1-alt1 1508266400 installed <13>Dec 4 18:52:01 rpmi: libgtk+3-3.24.23-alt2 sisyphus+258314.2000.14.2 1600845597 installed <13>Dec 4 18:52:01 rpmi: gtk3-demo-3.24.23-alt2 sisyphus+258314.2000.14.2 1600845597 installed <13>Dec 4 18:52:01 rpmi: libgail3-3.24.23-alt2 sisyphus+258314.2000.14.2 1600845597 installed <13>Dec 4 18:52:01 rpmi: libnss-3.59.0-alt1 sisyphus+261953.100.4.1 1605879637 installed <13>Dec 4 18:52:04 rpmi: java-1.8.0-openjdk-headless-0:1.8.0.212.b04-alt2_0jpp8 sisyphus+255828.100.2.1 1596585346 installed <13>Dec 4 18:52:04 rpmi: java-stub-javadoc-0.1-alt1 1229813340 installed <13>Dec 4 18:52:04 rpmi: alsa-ucm-conf-1.2.4-alt1 sisyphus+260180.200.1.1 1603282405 installed <13>Dec 4 18:52:04 rpmi: alsa-topology-conf-1.2.4-alt1 sisyphus+260180.100.1.1 1603282384 installed <13>Dec 4 18:52:05 rpmi: libalsa-1:1.2.4-alt1 sisyphus+260180.300.1.1 1603282509 installed <13>Dec 4 18:52:05 rpmi: java-1.8.0-openjdk-0:1.8.0.212.b04-alt2_0jpp8 sisyphus+255828.100.2.1 1596585346 installed <13>Dec 4 18:52:05 rpmi: java-1.8.0-openjdk-devel-0:1.8.0.212.b04-alt2_0jpp8 sisyphus+255828.100.2.1 1596585346 installed <13>Dec 4 18:52:09 rpmi: java-11-openjdk-headless-0:11.0.9.7-alt1_0.0.eajpp11 sisyphus+259318.100.1.3 1602002400 installed <13>Dec 4 18:52:16 rpmi: java-11-openjdk-0:11.0.9.7-alt1_0.0.eajpp11 sisyphus+259318.100.1.3 1602002400 installed <13>Dec 4 18:52:17 rpmi: java-11-openjdk-devel-0:11.0.9.7-alt1_0.0.eajpp11 sisyphus+259318.100.1.3 1602002400 installed <13>Dec 4 18:52:17 rpmi: jpackage-generic-compat-0.30-alt1 sisyphus+234288.100.1.1 1562847521 installed <13>Dec 4 18:52:17 rpmi: javapackages-local-1:5.3.0-alt1_4jpp8 sisyphus+234467.100.1.1 1563037789 installed <13>Dec 4 18:52:17 rpmi: nekohtml-0:1.9.22-alt1_11jpp8 sisyphus+246358.100.1.1 1581799490 installed <13>Dec 4 18:52:17 rpmi: ant-0:1.10.5-alt1_5jpp8 sisyphus+232747.100.2.1 1561092977 installed Building target platforms: i586 Building for target i586 Wrote: /usr/src/in/nosrpm/boilerpipe-1.2.0-alt1_13jpp8.nosrc.rpm Installing boilerpipe-1.2.0-alt1_13jpp8.src.rpm Building target platforms: i586 Building for target i586 Executing(%prep): /bin/sh -e /usr/src/tmp/rpm-tmp.54091 + umask 022 + /bin/mkdir -p /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + rm -rf boilerpipe-1.2.0 + echo 'Source #0 (boilerpipe-1.2.0-src.tar.gz):' Source #0 (boilerpipe-1.2.0-src.tar.gz): + /bin/tar -xf - + /bin/gzip -dc /usr/src/RPM/SOURCES/boilerpipe-1.2.0-src.tar.gz + cd boilerpipe-1.2.0 + /bin/chmod -c -Rf u+rwX,go-w . + find . -iname '*.jar' -delete + find . -iname '*.class' -delete + echo 'Patch #0 (boilerpipe-1.2.0-libdir-patch):' Patch #0 (boilerpipe-1.2.0-libdir-patch): + /usr/bin/patch -p0 patching file build.xml + cp /usr/src/RPM/SOURCES/boilerpipe-1.2.0.pom pom.xml + echo 'Patch #1 (boilerpipe-1.2.0-nekohtml-patch):' Patch #1 (boilerpipe-1.2.0-nekohtml-patch): + /usr/bin/patch -p1 patching file pom.xml patching file src/main/org/cyberneko/html/HTMLElements.java patching file src/main/org/cyberneko/html/HTMLTagBalancer.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextBlock.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/document/TextDocument.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/TagAction.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java + for s in src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeInput.java src/main/de/l3s/boilerpipe/BoilerpipeFilter.java src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java src/main/de/l3s/boilerpipe/BoilerpipeProcessingException.java src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java src/main/de/l3s/boilerpipe/document/TextBlock.java src/main/de/l3s/boilerpipe/document/TextDocumentStatistics.java src/main/de/l3s/boilerpipe/document/TextDocument.java src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingWithMinKWordsExtractor.java src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java src/main/de/l3s/boilerpipe/extractors/CommonExtractors.java src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java src/main/de/l3s/boilerpipe/extractors/KeepEverythingExtractor.java src/main/de/l3s/boilerpipe/filters/english/HeuristicFilterBase.java src/main/de/l3s/boilerpipe/filters/english/KeepLargestFulltextBlockFilter.java src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java src/main/de/l3s/boilerpipe/filters/english/MinFulltextWordsFilter.java src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/KeepLargestBlockFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/DocumentTitleMatchClassifier.java src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java src/main/de/l3s/boilerpipe/filters/heuristics/ContentFusion.java src/main/de/l3s/boilerpipe/filters/simple/MinWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToBoilerplateFilter.java src/main/de/l3s/boilerpipe/filters/simple/LabelToContentFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/InvertedFilter.java src/main/de/l3s/boilerpipe/filters/simple/MinClauseWordsFilter.java src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java src/main/de/l3s/boilerpipe/filters/simple/MarkEverythingContentFilter.java src/main/de/l3s/boilerpipe/labels/DefaultLabels.java src/main/de/l3s/boilerpipe/labels/ConditionalLabelAction.java src/main/de/l3s/boilerpipe/labels/LabelAction.java src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLContentHandler.java src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java src/main/de/l3s/boilerpipe/sax/TagActionMap.java src/main/de/l3s/boilerpipe/sax/InputSourceable.java src/main/de/l3s/boilerpipe/sax/HTMLDocument.java src/main/de/l3s/boilerpipe/sax/CommonTagActions.java src/main/de/l3s/boilerpipe/sax/DefaultTagActionMap.java src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java src/main/de/l3s/boilerpipe/sax/TagAction.java src/main/de/l3s/boilerpipe/sax/MarkupTagAction.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + native2ascii -encoding UTF8 src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java src/main/de/l3s/boilerpipe/util/UnicodeTokenizer.java + exit 0 Executing(%build): /bin/sh -e /usr/src/tmp/rpm-tmp.49146 + umask 022 + /bin/mkdir -p /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + cd boilerpipe-1.2.0 + ant -Dapp.javaversion=1.6 Buildfile: /usr/src/RPM/BUILD/boilerpipe-1.2.0/build.xml clean: [mkdir] Created dir: /usr/src/RPM/BUILD/boilerpipe-1.2.0/javadoc/1.2 init: [mkdir] Created dir: /usr/src/RPM/BUILD/boilerpipe-1.2.0/build [mkdir] Created dir: /usr/src/RPM/BUILD/boilerpipe-1.2.0/build/main [mkdir] Created dir: /usr/src/RPM/BUILD/boilerpipe-1.2.0/build/demo [mkdir] Created dir: /usr/src/RPM/BUILD/boilerpipe-1.2.0/dist javadoc: [javadoc] Generating Javadoc [javadoc] Javadoc execution [javadoc] Loading source files for package de.l3s.boilerpipe... [javadoc] Loading source files for package de.l3s.boilerpipe.conditions... [javadoc] Loading source files for package de.l3s.boilerpipe.document... [javadoc] Loading source files for package de.l3s.boilerpipe.estimators... [javadoc] Loading source files for package de.l3s.boilerpipe.extractors... [javadoc] Loading source files for package de.l3s.boilerpipe.filters.english... [javadoc] Loading source files for package de.l3s.boilerpipe.filters.heuristics... [javadoc] Loading source files for package de.l3s.boilerpipe.filters.simple... [javadoc] Loading source files for package de.l3s.boilerpipe.labels... [javadoc] Loading source files for package de.l3s.boilerpipe.sax... [javadoc] Loading source files for package de.l3s.boilerpipe.util... [javadoc] Constructing Javadoc information... [javadoc] Standard Doclet version 11.0.9-ea [javadoc] Building tree for all the packages and classes... [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/BoilerpipeFilter.java:36: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java:21: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java:33: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java:44: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/BoilerpipeExtractor.java:54: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/BoilerpipeInput.java:32: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java:33: warning: no description for @param [javadoc] * @param tb [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/conditions/TextBlockCondition.java:34: error: malformed HTML [javadoc] * @return iff the condition is met. [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/document/TextBlock.java:252: warning: no description for @return [javadoc] * @return [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/document/TextDocument.java:78: warning: no description for @param [javadoc] * @param title [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java:46: warning: no description for @param [javadoc] * @param dsBefore [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/estimators/SimpleEstimator.java:47: warning: no description for @param [javadoc] * @param dsAfter [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java:47: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java:64: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java:83: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java:98: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/ExtractorBase.java:109: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/ArticleExtractor.java:43: warning: no @return [javadoc] public static ArticleExtractor getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/ArticleSentencesExtractor.java:36: warning: no @return [javadoc] public static ArticleSentencesExtractor getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/CanolaExtractor.java:43: warning: no @return [javadoc] public static CanolaExtractor getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/DefaultExtractor.java:37: warning: no @return [javadoc] public static DefaultExtractor getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/LargestContentExtractor.java:42: warning: no @return [javadoc] public static LargestContentExtractor getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/extractors/NumWordsRulesExtractor.java:36: warning: no @return [javadoc] public static NumWordsRulesExtractor getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/english/DensityRulesClassifier.java:43: warning: no @return [javadoc] public static DensityRulesClassifier getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFilter.java:47: warning: no @return [javadoc] public static IgnoreBlocksAfterContentFilter getDefaultInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/english/NumWordsRulesClassifier.java:42: warning: no @return [javadoc] public static NumWordsRulesClassifier getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/english/TerminatingBlocksFinder.java:40: warning: no @return [javadoc] public static TerminatingBlocksFinder getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java:44: error: @param name not found [javadoc] * @param maxBlocksDistance The maximum distance in blocks. [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java:45: error: @param name not found [javadoc] * @param contentOnly [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java:45: warning: no description for @param [javadoc] * @param contentOnly [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/AddPrecedingLabelsFilter.java:47: warning: no @param for labelPrefix [javadoc] public AddPrecedingLabelsFilter(final String labelPrefix) { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java:55: warning: no description for @param [javadoc] * @param contentOnly [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/BlockProximityFusion.java:57: warning: no @param for sameTagLevelOnly [javadoc] public BlockProximityFusion(final int maxBlocksDistance, [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/ExpandTitleToContentFilter.java:40: warning: no @return [javadoc] public static ExpandTitleToContentFilter getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java:45: error: @param name not found [javadoc] * @param maxBlocksDistance The maximum distance in blocks. [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java:46: error: @param name not found [javadoc] * @param contentOnly [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java:46: warning: no description for @param [javadoc] * @param contentOnly [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/LabelFusion.java:48: warning: no @param for labelPrefix [javadoc] public LabelFusion(final String labelPrefix) { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/heuristics/SimpleBlockFusionProcessor.java:39: warning: no @return [javadoc] public static SimpleBlockFusionProcessor getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/simple/BoilerplateBlockFilter.java:39: warning: no @return [javadoc] public static BoilerplateBlockFilter getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/simple/SplitParagraphBlocksFilter.java:45: warning: no @return [javadoc] public static SplitParagraphBlocksFilter getInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/BoilerpipeHTMLParser.java:47: warning: no description for @param [javadoc] * @param contentHandler [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java:40: warning: no description for @param [javadoc] * @param is [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java:41: warning: no description for @throws [javadoc] * @throws SAXException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/BoilerpipeSAXInput.java:59: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java:27: warning: no description for @param [javadoc] * @param url [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java:28: warning: no description for @return [javadoc] * @return [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLFetcher.java:29: warning: no description for @throws [javadoc] * @throws IOException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:54: warning: no @return [javadoc] public static HTMLHighlighter newHighlightingInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:62: warning: no @return [javadoc] public static HTMLHighlighter newExtractingInstance() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:88: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:90: warning: no @return [javadoc] public String process(final TextDocument doc, final String origHTML) [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:103: warning: no description for @throws [javadoc] * @throws BoilerpipeProcessingException [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:105: warning: no @return [javadoc] public String process(final TextDocument doc, final InputSource is) [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:162: warning: no @return [javadoc] public boolean isOutputHighlightOnly() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:170: warning: no @param for outputHighlightOnly [javadoc] public void setOutputHighlightOnly(boolean outputHighlightOnly) { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:181: warning: no @return [javadoc] public String getExtraStyleSheet() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:203: error: invalid entity &qupt; [javadoc] * <span class=&qupt;x-boilerpipe-mark1"> [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:205: warning: no @return [javadoc] public String getPreHighlight() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:215: warning: no @param for preHighlight [javadoc] public void setPreHighlight(String preHighlight) { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:225: warning: no @return [javadoc] public String getPostHighlight() { [javadoc] ^ [javadoc] /usr/src/RPM/BUILD/boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/sax/HTMLHighlighter.java:234: warning: no @param for postHighlight [javadoc] public void setPostHighlight(String postHighlight) { [javadoc] ^ [javadoc] Building index for all the packages and classes... [javadoc] Building index for all classes... [javadoc] Building index for all classes... [javadoc] Generating /usr/src/RPM/BUILD/boilerpipe-1.2.0/javadoc/1.2/help-doc.html... [javadoc] 6 errors [javadoc] 56 warnings compile: [javac] /usr/src/RPM/BUILD/boilerpipe-1.2.0/build.xml:93: warning: 'includeantruntime' was not set, defaulting to build.sysclasspath=last; set to false for repeatable builds [javac] Compiling 62 source files to /usr/src/RPM/BUILD/boilerpipe-1.2.0/build/main [javac] warning: [options] bootstrap class path not set in conjunction with -source 6 [javac] warning: [options] source value 6 is obsolete and will be removed in a future release [javac] warning: [options] target value 1.6 is obsolete and will be removed in a future release [javac] warning: [options] To suppress warnings about obsolete options, use -Xlint:-options. [javac] 4 warnings [javac] /usr/src/RPM/BUILD/boilerpipe-1.2.0/build.xml:94: warning: 'includeantruntime' was not set, defaulting to build.sysclasspath=last; set to false for repeatable builds [javac] Compiling 3 source files to /usr/src/RPM/BUILD/boilerpipe-1.2.0/build/demo [javac] warning: [options] bootstrap class path not set in conjunction with -source 6 [javac] warning: [options] source value 6 is obsolete and will be removed in a future release [javac] warning: [options] target value 1.6 is obsolete and will be removed in a future release [javac] warning: [options] To suppress warnings about obsolete options, use -Xlint:-options. [javac] 4 warnings jars: [jar] Building jar: /usr/src/RPM/BUILD/boilerpipe-1.2.0/dist/boilerpipe-1.2.0.jar [jar] Building jar: /usr/src/RPM/BUILD/boilerpipe-1.2.0/dist/boilerpipe-demo-1.2.0.jar [jar] Building jar: /usr/src/RPM/BUILD/boilerpipe-1.2.0/dist/boilerpipe-javadoc-1.2.0.jar [jar] Building jar: /usr/src/RPM/BUILD/boilerpipe-1.2.0/dist/boilerpipe-sources-1.2.0.jar dist: [tar] Building tar: /usr/src/RPM/BUILD/boilerpipe-1.2.0/dist/boilerpipe-1.2.0-bin.tar.gz [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/extractors/class-use/KeepEverythingWithMinKWordsExtractor.html longer than 100 characters. [tar] Resulting tar file can only be processed successfully by GNU compatible tar commands [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/english/class-use/DensityRulesClassifier.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/english/class-use/IgnoreBlocksAfterContentFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/english/class-use/IgnoreBlocksAfterContentFromEndFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/english/class-use/KeepLargestFulltextBlockFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/english/class-use/MinFulltextWordsFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/english/class-use/NumWordsRulesClassifier.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/english/class-use/TerminatingBlocksFinder.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/heuristics/class-use/AddPrecedingLabelsFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/heuristics/class-use/ArticleMetadataFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/heuristics/class-use/BlockProximityFusion.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/heuristics/class-use/DocumentTitleMatchClassifier.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/heuristics/class-use/ExpandTitleToContentFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/heuristics/class-use/KeepLargestBlockFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/heuristics/class-use/SimpleBlockFusionProcessor.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/simple/class-use/LabelToBoilerplateFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/simple/class-use/MarkEverythingContentFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/simple/class-use/SplitParagraphBlocksFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/filters/simple/class-use/SurroundingToContentFilter.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/sax/class-use/CommonTagActions.BlockTagLabelAction.html longer than 100 characters. [tar] Entry: boilerpipe-1.2.0/javadoc/1.2/de/l3s/boilerpipe/sax/class-use/CommonTagActions.InlineTagLabelAction.html longer than 100 characters. [tar] Building tar: /usr/src/RPM/BUILD/boilerpipe-1.2.0/dist/boilerpipe-1.2.0-src.tar.gz [tar] Entry: boilerpipe-1.2.0/src/main/de/l3s/boilerpipe/filters/english/IgnoreBlocksAfterContentFromEndFilter.java longer than 100 characters. [tar] Resulting tar file can only be processed successfully by GNU compatible tar commands BUILD SUCCESSFUL Total time: 5 seconds + exit 0 Executing(%install): /bin/sh -e /usr/src/tmp/rpm-tmp.20975 + umask 022 + /bin/mkdir -p /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + /bin/chmod -Rf u+rwX -- /usr/src/tmp/boilerpipe-buildroot + : + /bin/rm -rf -- /usr/src/tmp/boilerpipe-buildroot + cd boilerpipe-1.2.0 + /usr/bin/python3 /usr/share/java-utils/mvn_artifact.py pom.xml dist/boilerpipe-1.2.0.jar + /usr/bin/python3 /usr/share/java-utils/mvn_file.py de.l3s.boilerpipe:boilerpipe boilerpipe + xmvn-install -R .xmvn-reactor -n boilerpipe -d /usr/src/tmp/boilerpipe-buildroot [INFO] Installing artifact de.l3s.boilerpipe:boilerpipe:pom:1.2.0 [INFO] Installing artifact de.l3s.boilerpipe:boilerpipe:jar:1.2.0 [INFO] Installation successful + jdir=javadoc/1.2 + /bin/mkdir -p /usr/src/tmp/boilerpipe-buildroot/usr/share/license + '[' -d javadoc/1.2 ']' + install -dm755 /usr/src/tmp/boilerpipe-buildroot/usr/share/javadoc/boilerpipe + cp -pr javadoc/1.2/allclasses-index.html javadoc/1.2/allclasses.html javadoc/1.2/allpackages-index.html javadoc/1.2/constant-values.html javadoc/1.2/de javadoc/1.2/deprecated-list.html javadoc/1.2/element-list javadoc/1.2/help-doc.html javadoc/1.2/index-all.html javadoc/1.2/index.html javadoc/1.2/jquery javadoc/1.2/member-search-index.js javadoc/1.2/member-search-index.zip javadoc/1.2/overview-summary.html javadoc/1.2/overview-tree.html javadoc/1.2/package-search-index.js javadoc/1.2/package-search-index.zip javadoc/1.2/resources javadoc/1.2/script.js javadoc/1.2/search.js javadoc/1.2/serialized-form.html javadoc/1.2/stylesheet.css javadoc/1.2/type-search-index.js javadoc/1.2/type-search-index.zip /usr/src/tmp/boilerpipe-buildroot/usr/share/javadoc/boilerpipe + echo /usr/share/javadoc/boilerpipe + install -pm 644 dist/boilerpipe-demo-1.2.0.jar /usr/src/tmp/boilerpipe-buildroot/usr/share/java/boilerpipe-demo.jar + /usr/lib/rpm/brp-alt Cleaning files in /usr/src/tmp/boilerpipe-buildroot (auto) Verifying and fixing files in /usr/src/tmp/boilerpipe-buildroot (binconfig,pkgconfig,libtool,desktop) Checking contents of files in /usr/src/tmp/boilerpipe-buildroot/ (default) Compressing files in /usr/src/tmp/boilerpipe-buildroot (auto) Verifying ELF objects in /usr/src/tmp/boilerpipe-buildroot (arch=normal,fhs=normal,lfs=relaxed,lint=relaxed,rpath=normal,stack=normal,textrel=normal,unresolved=normal) Hardlinking identical .pyc and .pyo files Processing files: boilerpipe-1.2.0-alt1_13jpp8 Executing(%doc): /bin/sh -e /usr/src/tmp/rpm-tmp.52363 + umask 022 + /bin/mkdir -p /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + cd boilerpipe-1.2.0 + DOCDIR=/usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-1.2.0 + export DOCDIR + rm -rf /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-1.2.0 + /bin/mkdir -p /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-1.2.0 + cp -prL --no-dereference LICENSE.txt NOTICE.txt /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-1.2.0 + chmod -R go-w /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-1.2.0 + chmod -R a+rX /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-1.2.0 + exit 0 Finding Provides (using /usr/lib/rpm/find-provides) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.ujeery find-provides: running scripts (alternatives,debuginfo,lib,maven,osgi-fc,pam,perl,pkgconfig,python,shell) [INFO maven.prov] input: ['/usr/src/tmp/boilerpipe-buildroot/usr/share/maven-metadata/boilerpipe.xml'] [INFO maven.prov] mvn(de.l3s.boilerpipe:boilerpipe) = 1.2.0, mvn(de.l3s.boilerpipe:boilerpipe:pom:) = 1.2.0 [INFO osgi.prov] input: ['/usr/src/tmp/boilerpipe-buildroot/usr/share/java/boilerpipe-demo.jar', '/usr/src/tmp/boilerpipe-buildroot/usr/share/java/boilerpipe.jar'] Finding Requires (using /usr/lib/rpm/find-requires) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.46Afix find-requires: running scripts (cpp,debuginfo,files,javadoc,lib,maven,osgi-fc,pam,perl,pkgconfig,pkgconfiglib,python,rpmlib,shebang,shell,static,symlinks,systemd-services) [INFO maven.req] input: ['/usr/src/tmp/boilerpipe-buildroot/usr/share/maven-metadata/boilerpipe.xml'] [INFO maven.req] javapackages-filesystem, mvn(net.sourceforge.nekohtml:nekohtml) [INFO osgi.req] input: ['/usr/src/tmp/boilerpipe-buildroot/usr/share/java/boilerpipe-demo.jar', '/usr/src/tmp/boilerpipe-buildroot/usr/share/java/boilerpipe.jar'] Provides: mvn(de.l3s.boilerpipe:boilerpipe) = 1.2.0, mvn(de.l3s.boilerpipe:boilerpipe:pom:) = 1.2.0 Requires: javapackages-filesystem, mvn(net.sourceforge.nekohtml:nekohtml) Processing files: boilerpipe-javadoc-1.2.0-alt1_13jpp8 Executing(%doc): /bin/sh -e /usr/src/tmp/rpm-tmp.68884 + umask 022 + /bin/mkdir -p /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + cd boilerpipe-1.2.0 + DOCDIR=/usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-javadoc-1.2.0 + export DOCDIR + rm -rf /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-javadoc-1.2.0 + /bin/mkdir -p /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-javadoc-1.2.0 + cp -prL --no-dereference LICENSE.txt NOTICE.txt /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-javadoc-1.2.0 + chmod -R go-w /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-javadoc-1.2.0 + chmod -R a+rX /usr/src/tmp/boilerpipe-buildroot/usr/share/doc/boilerpipe-javadoc-1.2.0 + exit 0 Finding Provides (using /usr/lib/rpm/find-provides) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.JC0lrw find-provides: running scripts (alternatives,debuginfo,lib,maven,osgi-fc,pam,perl,pkgconfig,python,shell) Finding Requires (using /usr/lib/rpm/find-requires) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.i7WDWx find-requires: running scripts (cpp,debuginfo,files,javadoc,lib,maven,osgi-fc,pam,perl,pkgconfig,pkgconfiglib,python,rpmlib,shebang,shell,static,symlinks,systemd-services) Requires: javapackages-filesystem Wrote: /usr/src/RPM/RPMS/noarch/boilerpipe-1.2.0-alt1_13jpp8.noarch.rpm Wrote: /usr/src/RPM/RPMS/noarch/boilerpipe-javadoc-1.2.0-alt1_13jpp8.noarch.rpm 25.40user 1.81system 0:18.80elapsed 144%CPU (0avgtext+0avgdata 135000maxresident)k 0inputs+0outputs (0major+403502minor)pagefaults 0swaps /.out/boilerpipe-1.2.0-alt1_13jpp8.noarch.rpm: license not found in '/usr/share/license' directory: ASL /.out/boilerpipe-1.2.0-alt1_13jpp8.noarch.rpm: license not found in '/usr/share/license' directory: 2.0 /.out/boilerpipe-javadoc-1.2.0-alt1_13jpp8.noarch.rpm: license not found in '/usr/share/license' directory: ASL /.out/boilerpipe-javadoc-1.2.0-alt1_13jpp8.noarch.rpm: license not found in '/usr/share/license' directory: 2.0 52.19user 7.74system 1:07.95elapsed 88%CPU (0avgtext+0avgdata 135000maxresident)k 1536inputs+0outputs (0major+1207392minor)pagefaults 0swaps --- boilerpipe-1.2.0-alt1_13jpp8.noarch.rpm.repo 2019-05-26 22:26:46.000000000 +0000 +++ boilerpipe-1.2.0-alt1_13jpp8.noarch.rpm.hasher 2020-12-04 18:52:46.912329011 +0000 @@ -7,3 +7,3 @@ /usr/share/maven-poms/boilerpipe.pom 100644 -Requires: javapackages-tools +Requires: javapackages-filesystem Requires: mvn(net.sourceforge.nekohtml:nekohtml) --- boilerpipe-javadoc-1.2.0-alt1_13jpp8.noarch.rpm.repo 2019-05-26 22:26:46.000000000 +0000 +++ boilerpipe-javadoc-1.2.0-alt1_13jpp8.noarch.rpm.hasher 2020-12-04 18:52:46.924329049 +0000 @@ -4,4 +4,5 @@ /usr/share/javadoc/boilerpipe 40755 -/usr/share/javadoc/boilerpipe/allclasses-frame.html 100644 -/usr/share/javadoc/boilerpipe/allclasses-noframe.html 100644 +/usr/share/javadoc/boilerpipe/allclasses-index.html 100644 +/usr/share/javadoc/boilerpipe/allclasses.html 100644 +/usr/share/javadoc/boilerpipe/allpackages-index.html 100644 /usr/share/javadoc/boilerpipe/constant-values.html 100644 @@ -25,3 +26,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/conditions/class-use/TextBlockCondition.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/conditions/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/conditions/package-summary.html 100644 @@ -37,3 +37,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/document/class-use/TextDocumentStatistics.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/document/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/document/package-summary.html 100644 @@ -45,3 +44,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/estimators/class-use/SimpleEstimator.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/estimators/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/estimators/package-summary.html 100644 @@ -71,3 +69,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/extractors/class-use/NumWordsRulesExtractor.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/extractors/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/extractors/package-summary.html 100644 @@ -92,3 +89,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/filters/english/class-use/TerminatingBlocksFinder.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/filters/english/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/filters/english/package-summary.html 100644 @@ -116,3 +112,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/filters/heuristics/class-use/SimpleBlockFusionProcessor.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/filters/heuristics/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/filters/heuristics/package-summary.html 100644 @@ -140,3 +135,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/filters/simple/class-use/SurroundingToContentFilter.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/filters/simple/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/filters/simple/package-summary.html 100644 @@ -152,3 +146,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/labels/class-use/LabelAction.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/labels/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/labels/package-summary.html 100644 @@ -156,3 +149,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/labels/package-use.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/package-summary.html 100644 @@ -192,3 +184,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/sax/class-use/TagActionMap.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/sax/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/sax/package-summary.html 100644 @@ -200,3 +191,2 @@ /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/util/class-use/UnicodeTokenizer.html 100644 -/usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/util/package-frame.html 100644 /usr/share/javadoc/boilerpipe/de/l3s/boilerpipe/util/package-summary.html 100644 @@ -205,2 +195,3 @@ /usr/share/javadoc/boilerpipe/deprecated-list.html 100644 +/usr/share/javadoc/boilerpipe/element-list 100644 /usr/share/javadoc/boilerpipe/help-doc.html 100644 @@ -208,10 +199,51 @@ /usr/share/javadoc/boilerpipe/index.html 100644 -/usr/share/javadoc/boilerpipe/overview-frame.html 100644 +/usr/share/javadoc/boilerpipe/jquery 40755 +/usr/share/javadoc/boilerpipe/jquery/external 40755 +/usr/share/javadoc/boilerpipe/jquery/external/jquery 40755 +/usr/share/javadoc/boilerpipe/jquery/external/jquery/jquery.js 100644 +/usr/share/javadoc/boilerpipe/jquery/images 40755 +/usr/share/javadoc/boilerpipe/jquery/images/ui-bg_glass_55_fbf9ee_1x400.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-bg_glass_65_dadada_1x400.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-bg_glass_75_dadada_1x400.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-bg_glass_75_e6e6e6_1x400.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-bg_glass_95_fef1ec_1x400.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-bg_highlight-soft_75_cccccc_1x100.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-icons_222222_256x240.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-icons_2e83ff_256x240.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-icons_454545_256x240.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-icons_888888_256x240.png 100644 +/usr/share/javadoc/boilerpipe/jquery/images/ui-icons_cd0a0a_256x240.png 100644 +/usr/share/javadoc/boilerpipe/jquery/jquery-3.5.1.js 100644 +/usr/share/javadoc/boilerpipe/jquery/jquery-ui.css 100644 +/usr/share/javadoc/boilerpipe/jquery/jquery-ui.js 100644 +/usr/share/javadoc/boilerpipe/jquery/jquery-ui.min.css 100644 +/usr/share/javadoc/boilerpipe/jquery/jquery-ui.min.js 100644 +/usr/share/javadoc/boilerpipe/jquery/jquery-ui.structure.css 100644 +/usr/share/javadoc/boilerpipe/jquery/jquery-ui.structure.min.css 100644 +/usr/share/javadoc/boilerpipe/jquery/jszip 40755 +/usr/share/javadoc/boilerpipe/jquery/jszip-utils 40755 +/usr/share/javadoc/boilerpipe/jquery/jszip-utils/dist 40755 +/usr/share/javadoc/boilerpipe/jquery/jszip-utils/dist/jszip-utils-ie.js 100644 +/usr/share/javadoc/boilerpipe/jquery/jszip-utils/dist/jszip-utils-ie.min.js 100644 +/usr/share/javadoc/boilerpipe/jquery/jszip-utils/dist/jszip-utils.js 100644 +/usr/share/javadoc/boilerpipe/jquery/jszip-utils/dist/jszip-utils.min.js 100644 +/usr/share/javadoc/boilerpipe/jquery/jszip/dist 40755 +/usr/share/javadoc/boilerpipe/jquery/jszip/dist/jszip.js 100644 +/usr/share/javadoc/boilerpipe/jquery/jszip/dist/jszip.min.js 100644 +/usr/share/javadoc/boilerpipe/member-search-index.js 100644 +/usr/share/javadoc/boilerpipe/member-search-index.zip 100644 /usr/share/javadoc/boilerpipe/overview-summary.html 100644 /usr/share/javadoc/boilerpipe/overview-tree.html 100644 -/usr/share/javadoc/boilerpipe/package-list 100644 +/usr/share/javadoc/boilerpipe/package-search-index.js 100644 +/usr/share/javadoc/boilerpipe/package-search-index.zip 100644 +/usr/share/javadoc/boilerpipe/resources 40755 +/usr/share/javadoc/boilerpipe/resources/glass.png 100644 +/usr/share/javadoc/boilerpipe/resources/x.png 100644 /usr/share/javadoc/boilerpipe/script.js 100644 +/usr/share/javadoc/boilerpipe/search.js 100644 /usr/share/javadoc/boilerpipe/serialized-form.html 100644 /usr/share/javadoc/boilerpipe/stylesheet.css 100644 -Requires: javapackages-tools +/usr/share/javadoc/boilerpipe/type-search-index.js 100644 +/usr/share/javadoc/boilerpipe/type-search-index.zip 100644 +Requires: javapackages-filesystem Requires: rpmlib(PayloadIsLzma)