Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
156 changes: 156 additions & 0 deletions lib/Logger.js
Original file line number Diff line number Diff line change
@@ -0,0 +1,156 @@
const fs = require('fs');
const path = require('path');

/**
* Advanced logging utility for web scraping activities
* Supports console and file-based logging with detailed error tracking
*/
class Logger {
/**
* Creates a new Logger instance
* @param {Object} options - Logger configuration options
* @param {string} [options.level='info'] - Logging level (debug, info, warn, error)
* @param {boolean} [options.enabled=true] - Enable/disable logging
* @param {string} [options.logFile] - Path to log file for persistent logging
*/
constructor(options = {}) {
this.level = options.level || 'info';
this.enabled = options.enabled !== false;
this.logFile = options.logFile || path.join(process.cwd(), 'scraper.log');
this.logLevels = ['debug', 'info', 'warn', 'error'];
}

/**
* Generate a timestamp for logging
* @returns {string} Formatted timestamp
*/
_getTimestamp() {
return new Date().toISOString();
}

/**
* Write log message to file
* @param {string} level - Log level
* @param {string} message - Log message
* @param {Object} [metadata] - Additional logging metadata
*/
_writeToFile(level, message, metadata = {}) {
if (!this.logFile) return;

const logEntry = JSON.stringify({
timestamp: this._getTimestamp(),
level,
message,
metadata
}) + '\n';

try {
fs.appendFileSync(this.logFile, logEntry);
} catch (error) {
console.error('Failed to write to log file:', error);
}
}

/**
* Check if a log level is enabled
* @param {string} level - Log level to check
* @returns {boolean} Whether the log level is enabled
*/
isLevelEnabled(level) {
const currentLevelIndex = this.logLevels.indexOf(this.level);
const checkLevelIndex = this.logLevels.indexOf(level);
return checkLevelIndex >= currentLevelIndex;
}

/**
* Log a successful page fetch
* @param {string} url - URL of the fetched page
* @param {Object} [details] - Additional fetch details
*/
logPageFetch(url, details = {}) {
if (!this.enabled || !this.isLevelEnabled('info')) return;

const message = `Page fetched successfully: ${url}`;
const metadata = {
url,
...details
};

console.log(`[INFO] ${message}`, metadata);
this._writeToFile('info', message, metadata);
}

/**
* Log a network or parsing error
* @param {string} type - Error type (network, parsing)
* @param {string} url - URL associated with the error
* @param {Error} error - The error object
* @param {Object} [details] - Additional error details
*/
logError(type, url, error, details = {}) {
if (!this.enabled || !this.isLevelEnabled('error')) return;

const message = `${type.toUpperCase()} Error: ${error.message}`;
const metadata = {
type,
url,
errorName: error.name,
errorMessage: error.message,
stack: error.stack,
...details
};

console.error(`[ERROR] ${message}`, metadata);
this._writeToFile('error', message, metadata);
}

/**
* Debug level logging
* @param {string} message - Log message
* @param {Object} [metadata] - Optional additional logging metadata
*/
debug(message, metadata = {}) {
if (!this.enabled || !this.isLevelEnabled('debug')) return;

console.log(`[DEBUG] ${message}`, metadata);
this._writeToFile('debug', message, metadata);
}

/**
* Info level logging
* @param {string} message - Log message
* @param {Object} [metadata] - Optional additional logging metadata
*/
info(message, metadata = {}) {
if (!this.enabled || !this.isLevelEnabled('info')) return;

console.log(`[INFO] ${message}`, metadata);
this._writeToFile('info', message, metadata);
}

/**
* Warning level logging
* @param {string} message - Log message
* @param {Object} [metadata] - Optional additional logging metadata
*/
warn(message, metadata = {}) {
if (!this.enabled || !this.isLevelEnabled('warn')) return;

console.warn(`[WARN] ${message}`, metadata);
this._writeToFile('warn', message, metadata);
}

/**
* Error level logging
* @param {string} message - Log message
* @param {Object} [metadata] - Optional additional logging metadata
*/
error(message, metadata = {}) {
if (!this.enabled || !this.isLevelEnabled('error')) return;

console.error(`[ERROR] ${message}`, metadata);
this._writeToFile('error', message, metadata);
}
}

module.exports = Logger;
12 changes: 9 additions & 3 deletions package.json
Original file line number Diff line number Diff line change
Expand Up @@ -25,10 +25,16 @@
},
"devDependencies": {
"jscs": ">=3.0.2",
"nodeunit": "0.11.3"
"nodeunit": "0.11.3",
"jest": "^29.7.0"
},
"scripts": {
"test": "node ./node_modules/.bin/nodeunit test"
"test": "jest",
"test:watch": "jest --watch"
},
"jest": {
"testEnvironment": "node",
"verbose": true
},
"license": "MIT",
"main": "index",
Expand All @@ -39,4 +45,4 @@
"bugs": {
"url": "https://github.com/rchipka/node-osmosis/issues"
}
}
}
124 changes: 124 additions & 0 deletions test/Logger.test.js
Original file line number Diff line number Diff line change
@@ -0,0 +1,124 @@
const fs = require('fs');
const path = require('path');
const Logger = require('../lib/Logger');

describe('Logger', () => {
let consoleSpy;
let testLogFile;

beforeEach(() => {
// Create a unique test log file for each test
testLogFile = path.join(process.cwd(), `test-${Date.now()}.log`);

consoleSpy = {
log: jest.spyOn(console, 'log').mockImplementation(),
warn: jest.spyOn(console, 'warn').mockImplementation(),
error: jest.spyOn(console, 'error').mockImplementation()
};
});

afterEach(() => {
// Restore console methods
consoleSpy.log.mockRestore();
consoleSpy.warn.mockRestore();
consoleSpy.error.mockRestore();

// Remove test log file if it exists
if (fs.existsSync(testLogFile)) {
fs.unlinkSync(testLogFile);
}
});

test('logPageFetch logs successful page fetch', () => {
const logger = new Logger({
level: 'info',
logFile: testLogFile
});
const testUrl = 'https://example.com';

logger.logPageFetch(testUrl, { statusCode: 200 });

// Check console output
expect(consoleSpy.log).toHaveBeenCalledWith(
expect.stringContaining('[INFO]'),
expect.objectContaining({
url: testUrl,
statusCode: 200
})
);

// Check log file content
const logContent = fs.readFileSync(testLogFile, 'utf-8');
const logEntry = JSON.parse(logContent.trim());

expect(logEntry).toMatchObject({
level: 'info',
message: `Page fetched successfully: ${testUrl}`,
metadata: {
url: testUrl,
statusCode: 200
}
});
});

test('logError logs network and parsing errors', () => {
const logger = new Logger({
level: 'error',
logFile: testLogFile
});
const testUrl = 'https://example.com';
const testError = new Error('Connection timeout');

logger.logError('network', testUrl, testError, { retryCount: 1 });

// Check console output
expect(consoleSpy.error).toHaveBeenCalledWith(
expect.stringContaining('[ERROR]'),
expect.objectContaining({
type: 'network',
url: testUrl,
errorMessage: 'Connection timeout',
retryCount: 1
})
);

// Check log file content
const logContent = fs.readFileSync(testLogFile, 'utf-8');
const logEntry = JSON.parse(logContent.trim());

expect(logEntry).toMatchObject({
level: 'error',
message: 'NETWORK Error: Connection timeout',
metadata: {
type: 'network',
url: testUrl,
errorName: 'Error',
errorMessage: 'Connection timeout',
retryCount: 1
}
});
expect(logEntry.metadata.stack).toBeDefined();
});

test('logger respects log level configuration', () => {
const logger = new Logger({
level: 'warn',
logFile: testLogFile
});

// These should not log
logger.debug('Debug message');
logger.info('Info message');

// This should log
logger.warn('Warning message', { context: 'test' });

// Check console output
expect(consoleSpy.log).not.toHaveBeenCalled();
expect(consoleSpy.error).not.toHaveBeenCalled();
expect(consoleSpy.warn).toHaveBeenCalledWith(
expect.stringContaining('[WARN]'),
{ context: 'test' }
);
});
});