<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	>

<channel>
	<title>SpiderMount</title>
	<atom:link href="http://www.webspidermount.com/blog/feed/" rel="self" type="application/rss+xml" />
	<link>http://www.webspidermount.com/blog</link>
	<description>Just another WordPress weblog</description>
	<pubDate>Fri, 11 Jun 2010 14:07:35 +0000</pubDate>
	<generator>http://wordpress.org/?v=2.7</generator>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
			<item>
		<title>Web Scraping Service</title>
		<link>http://www.webspidermount.com/blog/web-scraping-service-screen-data-harvesting/web-scraping/</link>
		<comments>http://www.webspidermount.com/blog/web-scraping-service-screen-data-harvesting/web-scraping/#comments</comments>
		<pubDate>Fri, 11 Jun 2010 14:03:37 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Web Scraping]]></category>

		<category><![CDATA[data extraction]]></category>

		<category><![CDATA[data mining]]></category>

		<category><![CDATA[screen scraping]]></category>

		<category><![CDATA[web harvesting]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=100</guid>
		<description><![CDATA[SpiderMount adds web scraping service to its software as service offering: screen scraping, data extraction, filtering and auto-posting.

Full service
SpiderMount does it all. Client provides URLs to spider and data posting instructions. SpiderMount support staff configures scraping, monitors  daily data extraction sessions, implements changes and outputs info.


More details:
web scraping service overview
pricing


]]></description>
			<content:encoded><![CDATA[<p>SpiderMount adds web scraping service to its software as service offering: screen scraping, data extraction, filtering and auto-posting.<code><br />
</code><br />
<strong>Full service</strong><br />
SpiderMount does it all. Client provides URLs to spider and data posting instructions. SpiderMount support staff configures scraping, monitors  daily data extraction sessions, implements changes and outputs info.<br />
<code><br />
</code><br />
<strong>More details:</strong><br />
<a href="/cm/products/web_spider">web scraping service overview</a><br />
<a href="/cm/pricing">pricing</a><br />
<code><br />
</code></p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/web-scraping-service-screen-data-harvesting/web-scraping/feed/</wfw:commentRss>
		</item>
		<item>
		<title>Replace Keywords And Improve Job Formatting</title>
		<link>http://www.webspidermount.com/blog/replace-keywords-and-improve-job-formatting/job-spider/</link>
		<comments>http://www.webspidermount.com/blog/replace-keywords-and-improve-job-formatting/job-spider/#comments</comments>
		<pubDate>Wed, 19 Aug 2009 07:17:55 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Job Spider]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=96</guid>
		<description><![CDATA[Job spider will search for keywords and phrases in source job HTML and replace or remove names, contacts, redundant HTML tags.


Set automatic keywords replacements for any part of original job  content: job description, title, contact info. Auto-post modified job posting to your database.
]]></description>
			<content:encoded><![CDATA[<p>Job spider will search for keywords and phrases in source job HTML and replace or remove names, contacts, redundant HTML tags.<br />
<code><br />
</code></p>
<p>Set automatic keywords replacements for any part of original job  content: job description, title, contact info. Auto-post modified job posting to your database.</p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/replace-keywords-and-improve-job-formatting/job-spider/feed/</wfw:commentRss>
		</item>
		<item>
		<title>Job Spider XML Interface For Bulk Posting</title>
		<link>http://www.webspidermount.com/blog/job-spider-xml-interface-for-bulk-posting/job-spider/</link>
		<comments>http://www.webspidermount.com/blog/job-spider-xml-interface-for-bulk-posting/job-spider/#comments</comments>
		<pubDate>Thu, 30 Apr 2009 15:19:26 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Configuration]]></category>

		<category><![CDATA[Job Spider]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=91</guid>
		<description><![CDATA[Job Spider auto-posts jobs packaged into XML file via HTTP.  A specific URL either obtains new jobs or removes expired ones. Whole process is automatically managed by Job Spider  scheduler.
 
Download XML/HTTP bulk posting interface description.
]]></description>
			<content:encoded><![CDATA[<p>Job Spider auto-posts jobs packaged into XML file via HTTP.  A specific URL either obtains new jobs or removes expired ones. Whole process is automatically managed by Job Spider  scheduler.</p>
<p> </p>
<p>Download <a href="http://www.webspidermount.com/download_files/Job_Spider_XML_Interface.pdf">XML/HTTP bulk posting interface description</a>.</p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/job-spider-xml-interface-for-bulk-posting/job-spider/feed/</wfw:commentRss>
		</item>
		<item>
		<title>Synchronize Jobs Via Incremental Scraping</title>
		<link>http://www.webspidermount.com/blog/sync-scraped-websites/job-spider/</link>
		<comments>http://www.webspidermount.com/blog/sync-scraped-websites/job-spider/#comments</comments>
		<pubDate>Mon, 06 Apr 2009 08:36:25 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Configuration]]></category>

		<category><![CDATA[Job Spider]]></category>

		<category><![CDATA[ATS]]></category>

		<category><![CDATA[incremental scraping]]></category>

		<category><![CDATA[posting]]></category>

		<category><![CDATA[scraping]]></category>

		<category><![CDATA[sync]]></category>

		<category><![CDATA[synchronization]]></category>

		<category><![CDATA[unique URLs]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=80</guid>
		<description><![CDATA[Keep your job listings up-to-date with source Employer websites by utilizing Synchronization feature of Job Spider. The tool will make sure only new jobs are added to your system and expire the vacancies removed from source websites.


Incremental scraping
Synchronization feature provides incremental downloads to make sure you don&#8217;t overload source websites with excessive requests, but only [...]]]></description>
			<content:encoded><![CDATA[<p>Keep your job listings up-to-date with source Employer websites by utilizing Synchronization feature of Job Spider. The tool will make sure only new jobs are added to your system and expire the vacancies removed from source websites.<br />
<code><br />
</code><br />
<strong>Incremental scraping<br />
<span style="font-weight: normal;">Synchronization feature provides <em>incremental</em> downloads to make sure you don&#8217;t overload source websites with excessive requests, but only download new jobs added to system.</span></strong><br />
<code><br />
</code></p>
<div><strong>Job Sync requirements:</strong></div>
<div>Job Sync feature requires HTTP/XML posting interface on a target job board.</div>
<div>The interface is to provide &#8220;Add&#8221; and &#8220;Remove&#8221; commands.</div>
<div>It is also to be able to return job ID to spider upon successful posting.</div>
<p><code><br />
</code></p>
<div><strong>Sync process:</strong></div>
<div>1. Spider runs search on Employer career center and assigns unique ID to each job / specific URL scraped.</div>
<div>2. Spider posts the job via HTTP/XML: posting interface of a Job Board returns unique job ID of each specific job posting.</div>
<div>3. Job Spider saves job ID from job board and links with Job ID of a Spider.</div>
<div>4. Next scraping sessions are done by spider. If the job is gone from job search results: job spider sends Remove ID command to job board XML interface.</div>
<div>5. Job board removes/expires the job.</div>
<p><code><br />
</code><br />
<strong>Job Spider screenshots:</strong></p>
<p><strong></strong><br />
Activate Synchronization for any scraping package/website:</p>
<p><img class="alignnone" title="Sync On" src="http://www.webspidermount.com/imglib/blog/allsync.jpg" alt="" width="525" height="165" /></p>
<p>Set job URL to be a unique identifier:</p>
<p><img class="alignnone" title="Sync by job URL" src="http://www.webspidermount.com/imglib/blog/set_job_sync.jpg" alt="" width="525" height="280" /></p>
<p>Resulting scraping sessions list:</p>
<p><img class="alignnone" title="Scraping package" src="http://www.webspidermount.com/imglib/blog/sync1.jpg" alt="" width="525" height="206" /></p>
<p>Hit &#8220;Items&#8221; to view jobs downloaded:</p>
<p>Replicating URLs (jobs scraped in earlier sessions) were not downloaded (<em>old</em> status):</p>
<p><img class="alignnone" title="old jobs" src="http://www.webspidermount.com/imglib/blog/sync3.jpg" alt="" width="525" height="164" /></p>
<p>Updates to the stored job data:<br />
- New: new jobs scraped during this session<br />
- Deleted: jobs removed from source website</p>
<p><img class="alignnone" title="Jobs list" src="http://www.webspidermount.com/imglib/blog/sync2.jpg" alt="" width="525" height="164" /></p>
<p><strong><br />
Posting to your job board / database:</strong><br />
Job Spider will synchronize jobs data with your recipient website or database.</p>
<p>Job ID from job board  (<em>Received ID</em>) will be received whilst posting and matched to Spider job ID (<em>Entity ID</em>):<br />
<img class="alignnone" title="job ids" src="http://www.webspidermount.com/imglib/blog/postids.jpg" alt="" width="491" height="166" /><br />
Jobs deleted from client source website will be removed from job board.</p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/sync-scraped-websites/job-spider/feed/</wfw:commentRss>
		</item>
		<item>
		<title>Posting To Multiple Websites</title>
		<link>http://www.webspidermount.com/blog/post_to_multiple_destinations/job-spider/</link>
		<comments>http://www.webspidermount.com/blog/post_to_multiple_destinations/job-spider/#comments</comments>
		<pubDate>Thu, 02 Apr 2009 09:41:15 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Configuration]]></category>

		<category><![CDATA[Job Spider]]></category>

		<category><![CDATA[multiple recipients]]></category>

		<category><![CDATA[post to multiple websites]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=76</guid>
		<description><![CDATA[A new feature is added to Job Spider to allow you to aggregate jobs and post to multiple websites of yours. 
 
Aggregate jobs from various sources, filter out by keywords, set up various XML or CSV posting formats for recipient websites and post.
 
Frequency of scraping

Run your scraping sessions:
- either automatically daily or weekly
- or run manual [...]]]></description>
			<content:encoded><![CDATA[<p>A new feature is added to Job Spider to allow you to aggregate jobs and post to multiple websites of yours. </p>
<p> </p>
<p>Aggregate jobs from various sources, filter out by keywords, set up various XML or CSV posting formats for recipient websites and post.</p>
<p> </p>
<p><strong>Frequency of scraping<br />
</strong></p>
<p>Run your scraping sessions:<br />
- either automatically daily or weekly<br />
- or run manual scrapes when required</p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/post_to_multiple_destinations/job-spider/feed/</wfw:commentRss>
		</item>
		<item>
		<title>Scrape Jobs And Export As CSV</title>
		<link>http://www.webspidermount.com/blog/scrape-and-compile-jobs-to-export-as-csv/job-spider/</link>
		<comments>http://www.webspidermount.com/blog/scrape-and-compile-jobs-to-export-as-csv/job-spider/#comments</comments>
		<pubDate>Fri, 27 Mar 2009 15:18:51 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Job Spider]]></category>

		<category><![CDATA[CSV file]]></category>

		<category><![CDATA[export]]></category>

		<category><![CDATA[post]]></category>

		<category><![CDATA[report]]></category>

		<category><![CDATA[spreadsheet]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=72</guid>
		<description><![CDATA[CSV files are configured via Job Spider tool to compile vacancy lists. CSV is both viewed as MS Excel spreadsheet and easily uploaded to most of databases.
 
Map CSVs for each source / job parsing configuration. Filter out desired vacancies from target career sites and compile into selected CSV files.
]]></description>
			<content:encoded><![CDATA[<p>CSV files are configured via Job Spider tool to compile vacancy lists. CSV is both viewed as MS Excel spreadsheet and easily uploaded to most of databases.</p>
<p> </p>
<p>Map CSVs for each source / job parsing configuration. Filter out desired vacancies from target career sites and compile into selected CSV files.</p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/scrape-and-compile-jobs-to-export-as-csv/job-spider/feed/</wfw:commentRss>
		</item>
		<item>
		<title>Jobs.co.za Subscribes For Scraping Service</title>
		<link>http://www.webspidermount.com/blog/jobscoza-integrates-job-spider/job-spider/</link>
		<comments>http://www.webspidermount.com/blog/jobscoza-integrates-job-spider/job-spider/#comments</comments>
		<pubDate>Fri, 06 Mar 2009 11:35:23 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Clients]]></category>

		<category><![CDATA[Job Spider]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=67</guid>
		<description><![CDATA[South African job portal subscribes for job spider service. Jobs collected are posted to a third party job board application interface.

 
Job scraping service pricing.
]]></description>
			<content:encoded><![CDATA[<p>South African job portal subscribes for job spider service. Jobs collected are posted to a third party job board application interface.</p>
<p><img class="alignnone" title="jobs co za" src="http://www.webspidermount.com/imglib/clients/jobscoza.jpg" alt="" width="525" height="74" /></p>
<p> </p>
<p>Job scraping service <a href="/cm/pricing/">pricing</a>.</p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/jobscoza-integrates-job-spider/job-spider/feed/</wfw:commentRss>
		</item>
		<item>
		<title>SAPJobFish Integrates Job Spider</title>
		<link>http://www.webspidermount.com/blog/sapjobfish-integrates-job-spider/job-spider/</link>
		<comments>http://www.webspidermount.com/blog/sapjobfish-integrates-job-spider/job-spider/#comments</comments>
		<pubDate>Thu, 05 Mar 2009 14:44:04 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Clients]]></category>

		<category><![CDATA[Job Spider]]></category>

		<category><![CDATA[hosted job spider service]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=62</guid>
		<description><![CDATA[Job Spider tool was configured for SAPJobFish.com, a job board dedicated to delivering great matching service for SAP professionals.

 
Employer job openings are scraped from source websites and synchronized with JobMount job board software. JobMount job site product is seamlessly integrated with Job Spider. 
 
SAPJobFish is subscribed to hosted job spider service.
]]></description>
			<content:encoded><![CDATA[<p>Job Spider tool was configured for SAPJobFish.com, a job board dedicated to delivering great matching service for SAP professionals.</p>
<p><img class="alignnone" title="job board" src="http://www.webspidermount.com/imglib/blog/bnr_sap.jpg" alt="" width="525" height="74" /></p>
<p> </p>
<p>Employer job openings are scraped from source websites and synchronized with JobMount <a href="http://www.jobboardmount.com" target="_blank">job board software</a>. JobMount job site product is seamlessly integrated with Job Spider. </p>
<p> </p>
<p>SAPJobFish is subscribed to <a href="/cm/pricing/">hosted job spider service</a>.</p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/sapjobfish-integrates-job-spider/job-spider/feed/</wfw:commentRss>
		</item>
		<item>
		<title>Job Scraping Example</title>
		<link>http://www.webspidermount.com/blog/job-scraping-example/job-spider/</link>
		<comments>http://www.webspidermount.com/blog/job-scraping-example/job-spider/#comments</comments>
		<pubDate>Tue, 24 Feb 2009 12:38:35 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Configuration]]></category>

		<category><![CDATA[Job Spider]]></category>

		<category><![CDATA[grab jobs]]></category>

		<category><![CDATA[html tags]]></category>

		<category><![CDATA[Job Listing]]></category>

		<category><![CDATA[job parsing]]></category>

		<category><![CDATA[job wrapping]]></category>

		<category><![CDATA[scraping]]></category>

		<category><![CDATA[source code]]></category>

		<category><![CDATA[spider configuration]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=57</guid>
		<description><![CDATA[Basic employer job search form usage, vacancy list spidering, parsing and XML generation example:
 
1. Job search form and list of jobs to spider:
- scrape all jobs or specify search criteria
- schedule for daily or weekly spidering
- filter out by desired / non-desired keywords

 
2. Job page downloading instructions abstract (Job Spider tool):
 
 
3. Example of a [...]]]></description>
			<content:encoded><![CDATA[<p>Basic employer job search form usage, vacancy list spidering, parsing and XML generation example:</p>
<p> </p>
<p><strong>1. Job search form and list of jobs to spider:</strong></p>
<p>- scrape all jobs or specify search criteria<br />
- schedule for daily or weekly spidering<br />
- filter out by desired / non-desired keywords</p>
<p><img src="http://www.webspidermount.com/imglib/demo/joblist.jpg" alt="list of jobs" /></p>
<p> </p>
<p><strong>2. Job page downloading instructions abstract (Job Spider tool):<br />
</strong> <img src="http://www.webspidermount.com/imglib/demo/jobscrape.jpg" alt="Job scrape" /></p>
<p> </p>
<p><strong>3. Example of a job advert scraped:</strong><br />
Fields highlighted will be extracted as per instructions below.</p>
<p><img src="http://www.webspidermount.com/imglib/demo/jobtext.jpg" alt="Job content" /></p>
<p> </p>
<p><strong>4. Source of the job to parse: </strong><br />
HTML and Javascript tags are used to identify job content.</p>
<p><img src="http://www.webspidermount.com/imglib/demo/jobxml.jpg" alt="job html" /></p>
<p> </p>
<p><strong>5. Job Spider configuration instructions for parsing:</strong><br />
Regular expressions are used for flexible content extraction from HTML source.</p>
<p><img src="http://www.webspidermount.com/imglib/demo/jbparse.jpg" alt="Parsing rules" /></p>
<p> </p>
<p><strong>6. Resulting XML to be auto-posted to your job board interface:</strong><br />
Match XML file to your job board fields for correct posting.</p>
<p><img src="http://www.webspidermount.com/imglib/demo/jobxmlresult.jpg" alt="Job XML" /></p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/job-scraping-example/job-spider/feed/</wfw:commentRss>
		</item>
		<item>
		<title>Integrate ATS With No APIs</title>
		<link>http://www.webspidermount.com/blog/integrate-ats-with-no-apis/job-spider/</link>
		<comments>http://www.webspidermount.com/blog/integrate-ats-with-no-apis/job-spider/#comments</comments>
		<pubDate>Mon, 23 Feb 2009 19:02:23 +0000</pubDate>
		<dc:creator>Valerii Verbovetsky</dc:creator>
		
		<category><![CDATA[Configuration]]></category>

		<category><![CDATA[Job Spider]]></category>

		<category><![CDATA[Applicant Tracking System]]></category>

		<category><![CDATA[ATS]]></category>

		<category><![CDATA[grab jobs]]></category>

		<category><![CDATA[Job Listing]]></category>

		<category><![CDATA[job wrapping]]></category>

		<guid isPermaLink="false">http://www.webspidermount.com/blog/?p=53</guid>
		<description><![CDATA[Job Spider is a simple option to avoid complex ATS integration. Retrieve jobs daily by opening online vacancy listings, extract job data and forward application to desired URL.
 
Some Applicant Tracking Systems do not provide API or XML export feature, but do publish vacancy listings in pre-defined formats.
 
Job Spider can be configured for grabbing the full [...]]]></description>
			<content:encoded><![CDATA[<p>Job Spider is a simple option to avoid complex ATS integration. Retrieve jobs daily by opening online vacancy listings, extract job data and forward application to desired URL.</p>
<p> </p>
<p>Some Applicant Tracking Systems do not provide API or XML export feature, but do publish vacancy listings in pre-defined formats.</p>
<p> </p>
<p>Job Spider can be configured for grabbing the full lists or selected openings, parsing the content and publishing extracted data to your career site or job board.</p>
]]></content:encoded>
			<wfw:commentRss>http://www.webspidermount.com/blog/integrate-ats-with-no-apis/job-spider/feed/</wfw:commentRss>
		</item>
	</channel>
</rss>

