Updated to the new pikotools API (api2021): HTMLFilter renamed to HTMLParser

Added to config: int html_filter_white_char_mode;
  controls how whitespace characters between HTML tags are treated:
  0 - WHITE_MODE_ORIGIN - they are copied from input to output
  1 - WHITE_MODE_SINGLE_LINE - newline characters are removed
  2 - WHITE_MODE_TREE - try to create a tree (a kind of pretty-printing)
  default: 2
This commit is contained in:
2021-08-07 02:16:48 +02:00
parent 22134b6cc0
commit b424988d1b
22 changed files with 369 additions and 175 deletions

View File

@@ -235,9 +235,8 @@ void Config::AssignValues(bool stdout_is_closed)
compression_page_min_size = Size(L"compression_page_min_size", 512);
compression_encoding = Int(L"compression_encoding", 20);
html_filter = Bool(L"html_filter", true);
html_filter_trim_white = Bool(L"html_filter_trim_white", true);
html_filter_break_word = Int(L"html_filter_break_word", 60);
html_filter = Bool(L"html_filter", false);
html_filter_white_char_mode = Int(L"html_filter_white_char_mode", 2);
html_filter_wrap_line = Int(L"html_filter_wrap_line", 110);
html_filter_tabs = Size(L"html_filter_tabs", 2);
html_filter_orphans = Bool(L"html_filter_orphans", true);