backup Hatena Space
by
a-kuma3
2016-01-23 [2016/01/23 16:57:58]
backup Hatena Space. see http://a-kuma3.hatenablog.com/entry/hatena_space_backup
@@ -101,163 +101,172 @@
var xhr = new XMLHttpRequest();
xhr.onload = function(e) {
if (e.target.status <= 200) {
- var doc = e.target.response;
- hspace_title = doc.querySelector("head title").innerHTML;
- var entry_container = doc.querySelector("div#entries");
-
- if (max_page == -1) {
- var last_entry = entry_container.querySelector("div.entry");
- last_entry_number = parseInt(last_entry.dataset.entryNumber, 10);
- max_page = Math.ceil(last_entry_number / 20.0);
- }
+ treatResponse(e.target.response);
+ }
+ };
- // remove entries of other users
- if (opt.only_my_entry) {
- try {
- var myid = doc.documentElement.dataset.userName;
- var re = new RegExp("/" + myid + "/$");
- Array.from(doc.querySelectorAll("div.entry div.author > a[href]")).forEach(function(e) {
- if (! re.test(e.href)) {
- removeNode(e.parentNode.parentNode.parentNode);
- }
- });
- } catch (ex) {
- console.error("ERROR: " + e.target.responseURL);
- console.error(ex);
- }
- }
+ function is_spam(entry) {
+ /*
+ TODO:
+ another spam pattern
+ */
+ var re = new RegExp("^https?://\\S+$");
+ if (re.test(entry.textContent)) {
+ return true;
+ }
- // remove spam entries
- {
- /*
- TODO:
- another spam pattern
- */
- var re = new RegExp("^https?://\\S+$");
- Array.from(doc.querySelectorAll("div.entry > div.body > div.plain")).forEach(function(e) {
- if (re.test(e.textContent)) {
- console.log("maybe spam: " + e.parentNode.parentNode.querySelector("div.author").textContent.replace(/\s/g, ""));
- removeNode(e.parentNode.parentNode);
- }
- });
- }
+ return false;
+ }
+
+ function treatResponse(resp) {
+ hspace_title = resp.querySelector("head title").innerHTML;
+ var entries = resp.querySelector("div#entries");
+
+ if (max_page == -1) {
+ var last_entry = entries.querySelector("div.entry");
+ last_entry_number = parseInt(last_entry.dataset.entryNumber, 10);
+ max_page = Math.ceil(last_entry_number / 20.0);
+ }
- // change user link space to profile of user
- {
- var sel = [
- "a.author-image-link",
- "div.meta > .author > a",
- "ul.comment-list > li > a",
- "ul.comment-list > li > .user-comment > a",
- "a.id-call",
- ].join(",");
- Array.from(doc.querySelectorAll(sel)).forEach(function(e) {
- e.href = e.href.replace(/space\.hatena\.ne\.jp/, "profile.hatena.ne.jp");
+ // remove entries of other users
+ if (opt.only_my_entry) {
+ try {
+ var myid = resp.documentElement.dataset.userName;
+ var re = new RegExp("/" + myid + "/$");
+ Array.from(entries.querySelectorAll("div.entry div.author > a[href]")).forEach(function(e) {
+ if (! re.test(e.href)) {
+ removeNode(e.parentNode.parentNode.parentNode);
+ }
});
+ } catch (ex) {
+ console.error("ERROR: " + e.target.responseURL);
+ console.error(ex);
}
+ }
- // display all comments
- Array.from(doc.querySelectorAll("div.comments > ul.comment-list li.hide")).forEach(function(e) {
- e.classList.remove("hide");
+ // remove spam entries
+ Array.from(entries.querySelectorAll("div.entry > div.body > div.plain")).forEach(function(e) {
+ if (is_spam(e)) {
+ console.log("maybe spam: " + e.parentNode.parentNode.querySelector("div.author").textContent.replace(/\s/g, ""));
+ removeNode(e.parentNode.parentNode);
+ }
+ });
+
+ // change user link space to profile of user
+ {
+ var sel = [
+ "a.author-image-link",
+ "div.meta > .author > a",
+ "ul.comment-list > li > a",
+ "ul.comment-list > li > .user-comment > a",
+ "a.id-call",
+ ].join(",");
+ Array.from(entries.querySelectorAll(sel)).forEach(function(e) {
+ e.href = e.href.replace(/space\.hatena\.ne\.jp/, "profile.hatena.ne.jp");
});
+ }
- // remove node (reduce size)
- {
- var sel = [
- // post form
- "div.comments > form.post-comment",
- "div.reply-action > form.quick-reply",
-
- // action element
- "div.comments > a.expand-comments",
- "ul.comment-list li div.comment-data > a.delete-comment",
- "div.reply-action > a.open-entry-menu",
- "div.reply-action > ul.entry-menu",
-
- // star button
- "div.reply-action button.star-add-button",
- ].join(",");
- Array.from(doc.querySelectorAll(sel)).forEach(function(e) {
- removeNode(e);
- });
- }
+ // display all comments
+ Array.from(entries.querySelectorAll("div.comments > ul.comment-list li.hide")).forEach(function(e) {
+ e.classList.remove("hide");
+ });
+
+ // remove node (reduce size)
+ {
+ var sel = [
+ // post form
+ "div.comments > form.post-comment",
+ "div.reply-action > form.quick-reply",
+
+ // action element
+ "div.comments > a.expand-comments",
+ "ul.comment-list li div.comment-data > a.delete-comment",
+ "div.reply-action > a.open-entry-menu",
+ "div.reply-action > ul.entry-menu",
+
+ // star button
+ "div.reply-action button.star-add-button",
+ ].join(",");
+ Array.from(entries.querySelectorAll(sel)).forEach(function(e) {
+ removeNode(e);
+ });
+ }
- // Hatena Star
- if (opt.expand_hatena_star) {
- var keys = [];
- Array.from(doc.querySelectorAll(".star-list-container")).forEach(function(e) {
- keys.push(e.dataset.resourceKey);
- });
- var url = "http://space.hatena.ne.jp/-/api/star?" + keys.map(function(e) {
- return "resource_key[]=" + e;
- }).join("&");
- var xx = new XMLHttpRequest();
- xx.open('GET', url, true);
- xx.onload = (function() {
- var ec = entry_container;
- return function(ev) {
- var a;
- eval("a=" + ev.target.responseText);
- a.resources.forEach(function(e) {
+ // Hatena Star
+ if (opt.expand_hatena_star) {
+ var keys = [];
+ Array.from(entries.querySelectorAll(".star-list-container")).forEach(function(e) {
+ keys.push(e.dataset.resourceKey);
+ });
+ var url = "http://space.hatena.ne.jp/-/api/star?" + keys.map(function(e) {
+ return "resource_key[]=" + e;
+ }).join("&");
+ var xx = new XMLHttpRequest();
+ xx.open('GET', url, true);
+ xx.onload = (function() {
+ var ec = entries;
+ return function(ev) {
+ var a;
+ eval("a=" + ev.target.responseText);
+ a.resources.forEach(function(e) {
//console.log(e);
- e.stars.forEach(function(ee) {
- var stcn = ec.querySelector('span.star-list-container[data-resource-key="' + ee.resource_key + '"]');
- var box = d_.createElement("span");
- box.className = "star-box";
- box.style.backgroundImage="url(" + ee.user.profile_image + ")";
- var img = d_.createElement("a");
- img.className = "star-image";
- img.href = "http://s.hatena.ne.jp" + ee.user.path;
- img.innerHTML = ee.user.name;
- box.appendChild(img);
- stcn.appendChild(box);
- });
+ e.stars.forEach(function(ee) {
+ var stcn = ec.querySelector('span.star-list-container[data-resource-key="' + ee.resource_key + '"]');
+ var box = d_.createElement("span");
+ box.className = "star-box";
+ box.style.backgroundImage="url(" + ee.user.profile_image + ")";
+ var img = d_.createElement("a");
+ img.className = "star-image";
+ img.href = "http://s.hatena.ne.jp" + ee.user.path;
+ img.innerHTML = ee.user.name;
+ box.appendChild(img);
+ stcn.appendChild(box);
});
- if (is_last_page) {
- finishLoading();
- }
- };
- })();
- xx.send(null);
- } else {
- var sel = [
- "div.reply-action div.star-container",
- ].join(",");
- Array.from(doc.querySelectorAll(sel)).forEach(function(e) {
- removeNode(e);
- });
- }
-
- // post time
- Array.from(doc.querySelectorAll("time")).forEach(function(e) {
- function d2(n) {
- return n < 9 ? "0"+n : n;
- }
- var t = new Date(parseInt(e.dataset.epochMilliseconds));
- e.innerHTML = t.getFullYear() + "/" + d2(t.getMonth()+1) + "/" + d2(t.getDate()) + " " +
- d2(t.getHours()) + ":" + d2(t.getMinutes()) + ":" + d2(t.getSeconds());
+ });
+ if (is_last_page) {
+ finishLoading();
+ }
+ };
+ })();
+ xx.send(null);
+ } else {
+ var sel = [
+ "div.reply-action div.star-container",
+ ].join(",");
+ Array.from(entries.querySelectorAll(sel)).forEach(function(e) {
+ removeNode(e);
});
+ }
+ // post time
+ Array.from(entries.querySelectorAll("time")).forEach(function(e) {
+ function d2(n) {
+ return n < 10 ? "0"+n : n;
+ }
+ var t = new Date(parseInt(e.dataset.epochMilliseconds));
+ e.innerHTML = t.getFullYear() + "/" + d2(t.getMonth()+1) + "/" + d2(t.getDate()) + " " +
+ d2(t.getHours()) + ":" + d2(t.getMinutes()) + ":" + d2(t.getSeconds());
+ });
+
+
+ hspace_pages.push(entries);
+
+ if (need_break) {
+ $id("progress").innerHTML = "BREAK Loading !";
+ return;
+ }
- hspace_pages.push(entry_container);
-
- if (need_break) {
- $id("progress").innerHTML = "BREAK Loading !";
- return;
- }
-
- is_last_page = !doc.querySelector("#timeline-pager-loading");
- if (is_last_page) {
- $id("progress").innerHTML = "FINISH Loading";
- if (! opt.expand_hatena_star) {
- setTimeout(finishLoading, 0);
- }
- } else {
- page += 1;
- loadEntries();
- }
+ is_last_page = !resp.querySelector("#timeline-pager-loading");
+ if (is_last_page) {
+ $id("progress").innerHTML = "FINISH Loading";
+ if (! opt.expand_hatena_star) {
+ setTimeout(finishLoading, 0);
+ }
+ } else {
+ page += 1;
+ loadEntries();
}
- };
+ }
function finishLoading() {
console.log("*** FINISH ***");
/*
* @title backup Hatena Space
* @description backup Hatena Space. see http://a-kuma3.hatenablog.com/entry/hatena_space_backup
* @include http://space.hatena.ne.jp/*
* @license MIT License
*/
(function(){
/*
[OPTIONS]
only_my_entry:
remove other users posts.
need login.
expand_hatena_star:
slower 10-50% to exract.
larger 10% or more.
embed_stylesheet:
need 218 KB more.
*/
var opt = {
only_my_entry: false,
expand_hatena_star: false,
embed_stylesheet: true,
};
// check location
re_check = new RegExp("^http://space\.hatena\.ne\.jp/~/\\d+/\\d+#?$");
if (! re_check.test(location.href)) {
console.log('"' + location.href + '"');
alert("use at topics page @ space.hatena.ne.jp.");
return;
}
var hspace_pages = [];
var hspace_stylesheet = "";
var hspace_title = "";
var need_break = false;
var is_last_page = false;
var page = 1;
var max_page = -1;
var last_entry_number = -1;
var d_ = document;
var b_ = d_.body;
var style_url = "http://space.hatena.ne.jp/css/master.css?47ab9942";
var t_start = new Date();
function setStyle(target, prop) {
for (k in prop) {
target.style[k] = prop[k];
}
}
function removeNode(e) {
e.parentNode.removeChild(e);
}
function $id(id) {
return d_.getElementById(id);
}
function createProgressView() {
if ($id("progress")) {
removeNode($id("progress").parentNode);
}
var panel = d_.createElement("DIV");
setStyle(panel, {
display: "inline-block",
position: "fixed",
top: "1ex",
right: "1ex",
backgroundColor: "green",
border: "2px inset darkgreen",
color: "white",
padding: "0.5ex 2ex",
zIndex: 1000,
});
var m = d_.createElement("DIV");
m.id = "progress";
m.innerHTML = " ";
panel.appendChild(m);
var btn = d_.createElement("BUTTON");
btn.innerHTML = "BREAK";
btn.style.marginTop = "0.5em";
btn.onclick = function() {
need_break = true;
};
panel.appendChild(btn);
b_.appendChild(panel);
}
var xhr = new XMLHttpRequest();
xhr.onload = function(e) {
if (e.target.status <= 200) {
treatResponse(e.target.response);
}
};
function is_spam(entry) {
/*
TODO:
another spam pattern
*/
var re = new RegExp("^https?://\\S+$");
if (re.test(entry.textContent)) {
return true;
}
return false;
}
function treatResponse(resp) {
hspace_title = resp.querySelector("head title").innerHTML;
var entries = resp.querySelector("div#entries");
if (max_page == -1) {
var last_entry = entries.querySelector("div.entry");
last_entry_number = parseInt(last_entry.dataset.entryNumber, 10);
max_page = Math.ceil(last_entry_number / 20.0);
}
// remove entries of other users
if (opt.only_my_entry) {
try {
var myid = resp.documentElement.dataset.userName;
var re = new RegExp("/" + myid + "/$");
Array.from(entries.querySelectorAll("div.entry div.author > a[href]")).forEach(function(e) {
if (! re.test(e.href)) {
removeNode(e.parentNode.parentNode.parentNode);
}
});
} catch (ex) {
console.error("ERROR: " + e.target.responseURL);
console.error(ex);
}
}
// remove spam entries
Array.from(entries.querySelectorAll("div.entry > div.body > div.plain")).forEach(function(e) {
if (is_spam(e)) {
console.log("maybe spam: " + e.parentNode.parentNode.querySelector("div.author").textContent.replace(/\s/g, ""));
removeNode(e.parentNode.parentNode);
}
});
// change user link space to profile of user
{
var sel = [
"a.author-image-link",
"div.meta > .author > a",
"ul.comment-list > li > a",
"ul.comment-list > li > .user-comment > a",
"a.id-call",
].join(",");
Array.from(entries.querySelectorAll(sel)).forEach(function(e) {
e.href = e.href.replace(/space\.hatena\.ne\.jp/, "profile.hatena.ne.jp");
});
}
// display all comments
Array.from(entries.querySelectorAll("div.comments > ul.comment-list li.hide")).forEach(function(e) {
e.classList.remove("hide");
});
// remove node (reduce size)
{
var sel = [
// post form
"div.comments > form.post-comment",
"div.reply-action > form.quick-reply",
// action element
"div.comments > a.expand-comments",
"ul.comment-list li div.comment-data > a.delete-comment",
"div.reply-action > a.open-entry-menu",
"div.reply-action > ul.entry-menu",
// star button
"div.reply-action button.star-add-button",
].join(",");
Array.from(entries.querySelectorAll(sel)).forEach(function(e) {
removeNode(e);
});
}
// Hatena Star
if (opt.expand_hatena_star) {
var keys = [];
Array.from(entries.querySelectorAll(".star-list-container")).forEach(function(e) {
keys.push(e.dataset.resourceKey);
});
var url = "http://space.hatena.ne.jp/-/api/star?" + keys.map(function(e) {
return "resource_key[]=" + e;
}).join("&");
var xx = new XMLHttpRequest();
xx.open('GET', url, true);
xx.onload = (function() {
var ec = entries;
return function(ev) {
var a;
eval("a=" + ev.target.responseText);
a.resources.forEach(function(e) {
//console.log(e);
e.stars.forEach(function(ee) {
var stcn = ec.querySelector('span.star-list-container[data-resource-key="' + ee.resource_key + '"]');
var box = d_.createElement("span");
box.className = "star-box";
box.style.backgroundImage="url(" + ee.user.profile_image + ")";
var img = d_.createElement("a");
img.className = "star-image";
img.href = "http://s.hatena.ne.jp" + ee.user.path;
img.innerHTML = ee.user.name;
box.appendChild(img);
stcn.appendChild(box);
});
});
if (is_last_page) {
finishLoading();
}
};
})();
xx.send(null);
} else {
var sel = [
"div.reply-action div.star-container",
].join(",");
Array.from(entries.querySelectorAll(sel)).forEach(function(e) {
removeNode(e);
});
}
// post time
Array.from(entries.querySelectorAll("time")).forEach(function(e) {
function d2(n) {
return n < 10 ? "0"+n : n;
}
var t = new Date(parseInt(e.dataset.epochMilliseconds));
e.innerHTML = t.getFullYear() + "/" + d2(t.getMonth()+1) + "/" + d2(t.getDate()) + " " +
d2(t.getHours()) + ":" + d2(t.getMinutes()) + ":" + d2(t.getSeconds());
});
hspace_pages.push(entries);
if (need_break) {
$id("progress").innerHTML = "BREAK Loading !";
return;
}
is_last_page = !resp.querySelector("#timeline-pager-loading");
if (is_last_page) {
$id("progress").innerHTML = "FINISH Loading";
if (! opt.expand_hatena_star) {
setTimeout(finishLoading, 0);
}
} else {
page += 1;
loadEntries();
}
}
function finishLoading() {
console.log("*** FINISH ***");
displayResultView();
console.log("display initialized");
displaySource();
console.log("source displayed");
var lapse = (new Date().getTime() - t_start.getTime()) / 1000;
console.log("=== COMPLETE === " + [
lapse + " sec",
max_page + " pages",
last_entry_number + " posts",
].join(", "));
}
function displayResultView() {
b_.innerHTML = "";
b_.classList.remove("new-space");
// source area
var sourceArea = d_.createElement("div");
setStyle(sourceArea, {
display: "inline-block",
width: "20em",
padding: "0.5ex 2ex",
backgroundColor: "palegoldenrod",
verticalAlign: "top",
});
function createUnitArea(dest, title, id, viewtype) {
var e_txt = d_.createElement("textarea");
e_txt.id = "source-" + id;
e_txt.rows = 5;
setStyle(e_txt, {
width: "100%",
display: "block",
});
var e_title = d_.createElement("a");
e_title.innerHTML = title;
e_title.href = "#";
setStyle(e_title, {
display: "block",
textDecoration: "underline",
borderLeft: "1em solid saddlebrown",
paddingLeft: "1ex",
marginTop: "0.5ex",
});
e_title.onclick = function() {
var viewArea = $id("view-area");
var dd_ = viewArea.contentWindow.document;
dd_.open(viewtype, "replace");
// dd_.charset = "Shift_JIS";
dd_.write(this.nextSibling.value);
dd_.close();
return false;
};
dest.appendChild(e_title);
dest.appendChild(e_txt);
}
createUnitArea(sourceArea, "entries HTML" , "entries" , "text/html");
createUnitArea(sourceArea, "style sheet" , "stylesheet", "text/plain");
createUnitArea(sourceArea, "images URL list", "imagelist" , "text/plain");
createUnitArea(sourceArea, "images HTML" , "imagepage" , "text/html");
b_.appendChild(sourceArea);
// preview frame
var viewArea = d_.createElement("iframe");
viewArea.id = "view-area";
setStyle(viewArea, {
width: "600px",
height: window.innerHeight + "px",
display: "inline-block",
verticalAlign: "top",
});
b_.appendChild(viewArea);
}
function code_stylesheet() {
var code = [
'<!-- need replace -->',
'<link rel="stylesheet" href="' + style_url + '" />',
].join("\n");
if (opt.embed_stylesheet) {
code = [
'<style>',
hspace_stylesheet,
'</style>',
].join("\n");
}
var star_image = [
"<style>",
".star-image {",
"background-image: url() !important;",
"}",
"</style>",
].join("\n");
return code + star_image;
}
function displaySource() {
// contents
var e = $id("source-entries");
e.value = [].concat([
"<!DOCTYPE html>",
"<html>",
'<head>',
'<meta charset="utf-8">',
'<title>' + hspace_title + "(アーカイブ)" + '</title>',
code_stylesheet(),
'</head>',
'<body>',
'<div id="main-container" style="width: 538px;">',
'<div class="container">',
'<div id="entry-container" class="entry-box">',
'<div id="entries">',
],
hspace_pages.map(function(e) {
return e.innerHTML;
}),
[
'</div>',
'</div>',
'</div>',
'</div>',
'</body>',
"</html>"
]).join("\n");
// image list
var image_list = [];
hspace_pages.forEach(function(e) {
Array.from(e.querySelectorAll('a[href^="http://cdn.mogile.archive.st-hatena.com/v1/image/"]')).forEach(function(a) {
image_list.push(a.href);
});
});
if (image_list.length > 0) {
// only url
e = $id("source-imagelist");
e.value = image_list.join("\n");
// thumbnail page
e = $id("source-imagepage");
e.value = [
"<!DOCTYPE html>",
"<html>",
"<head>",
"<title>",
hspace_title + "(アーカイブ:画像)",
"</title>",
"<style>",
"body {padding: 1ex;}",
"img {padding: 1ex;border: 1px solid gray; max-width: 100%;}",
"</style>",
"</head>",
"<body>",
image_list.map(function(e) {
return '<img src="' + e + '">';
}).join("\n"),
"</body>",
"</html>"].join("\n");
}
// stylesheet
var e = $id("source-stylesheet");
e.value = hspace_stylesheet;
}
function loadStyleSheet() {
var xx = new XMLHttpRequest();
xx.open('GET', style_url, true);
xx.onload = function(ev) {
hspace_stylesheet = ev.target.responseText;
};
xx.send(null);
}
function loadEntries() {
var msg = "Loading page:" + page + " / " + (max_page == -1 ? "?" : max_page) + " ...";
console.log(msg);
$id("progress").innerHTML = msg;
xhr.open('GET', location.pathname + "?p=" + page, true);
xhr.responseType = 'document';
xhr.send(null);
};
// opt.only_my_entry = confirm([
// "Only my POST ?",
// "",
// " OK : only my posts (need login)",
// " Cancel : all posts"
// ].join("\n"));
createProgressView();
loadEntries();
loadStyleSheet();
}());
- Permalink
- このページへの個別リンクです。
- RAW
- 書かれたコードへの直接のリンクです。
- Packed
- 文字列が圧縮された書かれたコードへのリンクです。
- Userscript
- Greasemonkey 等で利用する場合の .user.js へのリンクです。
- Loader
- @require やソースコードが長い場合に多段ロードする Loader コミのコードへのリンクです。
- Metadata
- コード中にコメントで @xxx と書かれたメタデータの JSON です。