Puppeteer node.js: Access denied when downloading image

1.1k Views Asked by At

I'm trying to download an image using the fs.createWriteStream function. I'm able to download the image but it's damaged/corrupted.I'm getting an error message saying: "Access Denied You don't have permission to access "https:..." on this server"

I'm using puppeteer on headless:false mode and I also set the user agent to: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/61.0.3163.100 Safari/537.36")

The function I'm calling to download the file is the following:

const https = require("https");
const http = require("http");
const fs = require ("fs");
const path = require("path");
const URL = require("url").URL;

function download (url, filepath,callback,){

    const userURL = new URL (url);
    const requestCaller = userURL.protocol === "http:" ? http : https;

    const filename = path.basename(url);
  
    const req = requestCaller.get(url, function(res){

         const fileStream = fs.createWriteStream(path.resolve(filepath,filename));
         res.pipe(fileStream);

            fileStream.on("error", function(err){
                console.log("Error writing to the stream.");
                console.log(err);
              });
            fileStream.on("close",function(){
                callback(filename);

            });

            fileStream.on("finish", function(){
                fileStream.close()
            });
        });
         req.on("error", function(err){
             console.log("Error downloading the file.");
             console.log(err);  
         });
         
     };

   module.exports.download = download;

The URL of the image I'm trying to download is this:

https://www.vrisko.gr/logos/775165.jpg

It seems I'm getting blocked by the server but I don't know what else to do apart from setting the user agent and not running puppeteer in headless mode. Any thoughts?

[EDIT]

Apparently there is an issue with the CORS policy. I checked the Network call and I see the following:

Referrer Policy: strict-origin-when-cross-origin sec-fetch-site: none

Whereas when I simply manually navigate from my browser, I get this:

Referrer Policy: unsafe-url sec-fetch-site: same-origin

Thanks a lot!

1

There are 1 best solutions below

0
On

I fixed all my errors with CORS policy by using npm module cors. Install it with 'npm install cors' and do this:

const cors = require('cors');
const app = express();
app.use(cors());
app.options('*', cors());