blob: 768e2700401fcd2bf7a9d729d2dcf67791cc7474 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
|
// Represents all functions for process the raw HTML and
// extracting information from it, transforming it, etc.
// All fns operate on strings.
import std.algorithm : findSplitAfter, find;
// Given the haystack (the full HTML) search for the RSS comment
// representing that attribute.
string find_rss_comment(string attr, string haystack)
in (haystack !is null)
{
immutable string needle = "<!-- rss-" ~ attr ~ ":";
string found = haystack.find(needle);
if (found is null)
return null;
// As otherwise comment begin will be in `found`.
found = found[needle.length .. $];
// And get before the closing comment.
string result = found.findSplitAfter("-->")[0];
return result;
}
string find_html_title(string htmltext)
{
// TODO: implement.
immutable string init_tag = "<title>";
string found = htmltext.find(init_tag);
if (found is null)
return null;
found = found[init_tag.length .. $];
string result = found.findSplitAfter("</title>")[0];
return result;
}
|