Friday, 11 August 2023

HTML code for scanning PDF links on a web page

 <!DOCTYPE html>



<title>Extract PDF Links</title>


/**
 * Scan the current document for anchors that point to PDF files and list each
 * one, followed by a "Download" button, inside the element with id "pdf-links".
 *
 * The results container is reused when it already exists (so the page never
 * ends up with two elements sharing the same id) and is emptied before each
 * run, so clicking the trigger repeatedly does not pile up duplicate entries.
 *
 * Takes no arguments and returns nothing; its only effect is on the DOM.
 */
function extractPDFLinks() {
  // NOTE(review): the URL typed into #webpageLink is not used here. Only the
  // anchors of the page this script runs in are scanned. Scanning another page
  // would require fetching and parsing it, which cross-origin rules may block.

  // True when the URL's path ends in ".pdf", ignoring letter case and any
  // query string or fragment (e.g. "report.PDF?download=1").
  var isPdfHref = function (href) {
    if (typeof href !== 'string') {
      return false; // e.g. SVG <a> elements expose a non-string href
    }
    return href.split(/[?#]/)[0].toLowerCase().endsWith('.pdf');
  };

  // Collect every anchor on the page whose target is a PDF file.
  var pdfLinks = Array.from(document.getElementsByTagName("a")).filter(function (anchor) {
    return isPdfHref(anchor.href);
  });

  // Reuse the existing results container; create and attach one only if the
  // page does not provide it.
  var container = document.getElementById('pdf-links');
  if (!container) {
    container = document.createElement('div');
    container.setAttribute('id', 'pdf-links');
    document.body.appendChild(container);
  }

  // Drop the results of any previous run.
  container.textContent = '';

  // forEach gives each iteration its own `link` binding, so every click
  // handler navigates to its own PDF rather than to the last one in the list.
  pdfLinks.forEach(function (link) {
    // Label: the anchor's text, falling back to the URL for image-only links.
    var span = document.createElement('span');
    span.textContent = (link.textContent || '').trim() || link.href;

    // Button that navigates the browser to the PDF.
    var button = document.createElement('button');
    button.setAttribute('type', 'button');
    button.textContent = 'Download';
    button.addEventListener('click', function () {
      window.location.href = link.href;
    });

    container.appendChild(span);
    container.appendChild(button);
  });
}






<h1>Extract PDF Links</h1>

<p>
  <!-- A visible label: the placeholder alone disappears once the user types. -->
  <label for="webpageLink">Webpage link</label>
  <input type="url" id="webpageLink" placeholder="Enter the webpage link">
</p>

<p>
  <button type="button" onclick="extractPDFLinks()">Extract PDF Links</button>
</p>

<!-- Results are injected here by extractPDFLinks(); aria-live announces them. -->
<div id="pdf-links" aria-live="polite"></div>