// Example: Crawling a title of websites var FILE = require("lib/file"); var HTTP = require("lib/http"); var Punycode = require("lib/punycode"); function main() { var lines = []; var district = JSON.parse(FILE.readFile("data\\korea-administrative-district.json", FILE.CdoCharset.CdoUTF_8)); var districtData = district.data; var domains = splitLn(FILE.readFile("data\\domains.txt", FILE.CdoCharset.CdoUTF_8)); var digFrame = function(handler, domain, response) { var frameURLs = handler.getFrameURLs(); if (frameURLs.length > 0) { frameURLs.forEach(function(x) { var _handler = HTTP.create("CURL") .setUserAgent("Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/101.0.4951.67 Safari/537.36") .setIsFollowRedirect(true) .open("GET", "http://" + Punycode.encode(domain) + "/" + x) .send(); response += _handler.responseBody; response = digFrame(_handler, domain, response); }); } return response; }; domains.forEach(function(domain) { var handler = HTTP.create("CURL") .setUserAgent("Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/101.0.4951.67 Safari/537.36") .setIsFollowRedirect(true) .open("GET", "http://" + Punycode.encode(domain) + "/") .send(); var response = handler.responseBody; response = digFrame(handler, domain, response); var pos = response.search(/[0-9]{3}-[0-9]{2}-[0-9]{5}/g); console.log("Position:", pos); var bizNo = ''; if (pos > -1) { bizNo = response.substring(pos, pos + 12); } var a = response.indexOf("