
View on GitHub


1 hr
Test Coverage
/**
 * @file Mongoose {@link scrapper} Schema definitions
 * @author based on whatever it takes to succeed boilerplate by Trevis Gulby
 */

const mongoose = require('mongoose');
// MongoDB connection string: the MONGO environment variable when it is set
// to a non-empty value, otherwise the local development database.
const mongoaddr = process.env.MONGO || 'mongodb://localhost:27017/test3';

/** The request model (to get rss feeds)
 * @constructor
 * @memberof module:models~
 * @property {String} host the request host; for now the yahoo api for rss to json
 * @property {String} path the path like /param=tto&otherparam=tonton
 * @property {Number} __v the mongoose version system
 */
const RequestSchemas = new mongoose.Schema({
    host: {
        type: String,
        required: true,
        trim: true,
    },
    path: {
        type: String,
        required: true,
        trim: true,
    },
    // Declared explicitly so that `select: false` applies to the version key.
    __v: {
        type: Number,
        select: false,
    },
    // NOTE(review): presumably meant to suppress the automatic _id on these
    // embedded documents; confirm the installed Mongoose version honours
    // `_id: false` inside the definition rather than in the options argument.
    _id: false,
});

/** The parsing model (to remove html markup and other garbage from feeds)
 * @constructor
 * @memberof module:models~
 * @property {String} regex the user submitted regex for cleaning content
 * @property {String} name optional name of the parsing rule, 'DEF' by default
 * @property {Number} __v the mongoose version system
 */
const ParsingSchemas = new mongoose.Schema({
    regex: {
        type: String,
        required: true,
    },
    name: {
        type: String,
        default: 'DEF',
        required: false,
    },
    // Declared explicitly so that `select: false` applies to the version key.
    __v: {
        type: Number,
        select: false,
    },
    // NOTE(review): presumably meant to suppress the automatic _id on these
    // embedded documents; confirm the installed Mongoose version honours
    // `_id: false` inside the definition rather than in the options argument.
    _id: false,
});

/** The scrapper sources schemas
 * @constructor
 * @memberof module:models~
 * @property {String} name the name of the feed like cointelegraph, cryptonews..
 * @property {String} fname optional file name for the source
 * @property {String} url the feed url (must be linked with req.path)
 * @property {Object} req the req model to call rss > json yahoo api
 * @property {Object} parse the regex for cleaning feed
 * @property {Number} __v the mongoose version system
 */
const SourcesSchema = new mongoose.Schema({
    name: {
        type: String,
        required: true,
        trim: true,
    },
    fname: {
        type: String,
        required: false,
        trim: true,
    },
    url: {
        type: String,
        required: true,
        trim: true,
    },
    // Embedded request description (RequestSchemas).
    req: {
        type: RequestSchemas,
        required: true,
    },
    // Embedded, optional parsing rule (ParsingSchemas).
    parse: {
        type: ParsingSchemas,
        required: false,
    },
    // Declared explicitly so that `select: false` applies to the version key.
    __v: {
        type: Number,
        select: false,
    },
});

/** The SourcesSchema.fname custom setter
 *
 * Appends a local-time stamp shaped `DDMMYYYY_H-mm.json` to the given name:
 * day, month and minutes are zero-padded to two digits, hours are not.
 * @param {String} fname the fname to be timestamped
 * @return {String} fname + timestamp + .json
 */
SourcesSchema.path('fname').set(function (fname) {
    const now = new Date();
    // Always yields a string, so the parts below are concatenated and can
    // never be summed as numbers (which happened when day and month were
    // both >= 10).
    const pad2 = (value) => (value < 10 ? '0' + value : String(value));
    // getDate() is already 1-based; only getMonth() is 0-based and needs + 1.
    const day = pad2(now.getDate());
    const month = pad2(now.getMonth() + 1);
    const stamp = day + month + now.getFullYear() +
        '_' + now.getHours() + '-' + pad2(now.getMinutes()) + '.json';
    // A Mongoose setter hands back the value to store; assigning to
    // `this.fname` from inside the fname setter is unnecessary and could
    // trigger the setter again.
    return fname + stamp;
});

/** The Scrapper schemas
 * @constructor
 * @memberof module:models~
 * @property {String} name the scrapper name
 * @property {Object} Sources the sources grouped by genre (Bank, Crypto,
 * Markets, Other); each genre holds `infos`, `prices` and `other` arrays of
 * SourcesSchema documents
 * @property {Date} Date a date attached to the scrapper
 */
const ScrapperSchemas = new mongoose.Schema({
    name: {
        type: String,
        required: true,
        trim: true,
    },
    Sources: {
        Bank: {
            infos: [SourcesSchema],
            prices: [SourcesSchema],
            other: [SourcesSchema],
        },
        Crypto: {
            infos: [SourcesSchema],
            prices: [SourcesSchema],
            other: [SourcesSchema],
        },
        Markets: {
            infos: [SourcesSchema],
            prices: [SourcesSchema],
            other: [SourcesSchema],
        },
        Other: {
            infos: [SourcesSchema],
            prices: [SourcesSchema],
            other: [SourcesSchema],
        },
    },
    Date: {
        type: Date,
    },
});

/** Add a new Source object to a Scrapper
 * @param {Object} uinput the user inputs and params, see below
 * @param {String} uinput.scrapperid the id of the user scrapper to update
 * @param {String} uinput.sourcegenre one of 'Bank', 'Crypto', 'Markets', 'Other'
 * @param {String} uinput.sourcetype the source type: 'infos', 'prices' or 'other'
 * @param {String} uinput.sourcename the source name
 * @param {String} uinput.sourceurl the source url
 * @param {String} uinput.sourcereqhost the source https base req host
 * @param {String} uinput.sourcereqpath the source https base req path
 * @param {String} uinput.sourceregex the regex used to clean the source content
 * @param {function} callback called with (error) or (null, result)
 * @todo normalise the insertion format before calling this function
 * @memberof module:models~ScrapperSchemas
 */
ScrapperSchemas.statics.addsource = (uinput, callback) => {
    // Obtain the 'Sources' model for SourcesSchema through mongoose.model.
    let Sources = mongoose.model('Sources', SourcesSchema);
    // Dotted path of the array that receives the source, e.g.
    // 'Sources.Crypto.infos'.
    let whatsource = 'Sources.' + uinput.sourcegenre + '.' + uinput.sourcetype;
    // Plain description of the new source, handed to Sources.create below.
    let newsource = {
        name: uinput.sourcename,
        url: uinput.sourceurl,
        req: {
            host: uinput.sourcereqhost,
            path: uinput.sourcereqpath,
        parse: {
            regex: uinput.sourceregex,
    Sources.create(newsource, (error, source) => {
        // $push payload: { '<dotted path>': <created source> }.
        let elemtype = {};
        elemtype[whatsource] = source;
        // NOTE(review): throwing inside this asynchronous callback bypasses
        // `callback`, so a creation error is never reported through it;
        // consider `callback(error)` instead.
        if (error) throw error;
        // NOTE(review): the statement that opens this update call (filter on
        // _id, then the $push update, then a callback) is not visible here;
        // confirm which model and method are invoked.
                _id: uinput.scrapperid,
            }, {
                $push: elemtype,
            // Forward the update error or result to the optional callback.
            (error, success) => {
                if (error) {
                    callback && callback(error);
                } else {
                    callback && callback(null, success);

/** Static helper on the Parseur model: extract the text of every
 * `<p>...</p>` element found in a chunk of markup.
 * @param {String} mess the raw markup to search
 * @return {String} the contents of all matched paragraphs joined with commas
 * and stripped of their <p> tags, or a 'PARSING-ERROR' message when the
 * input is not a string or holds no <p> element
 */
ParsingSchemas.statics.getptag = (mess) => {
    const notFound = 'PARSING-ERROR: No <p> tag(s) found';
    // Anything without String#match used to raise a TypeError here.
    if (typeof mess !== 'string') {
        return notFound;
    }
    // [\s\S] also matches line breaks, so paragraphs spanning several lines
    // are picked up instead of being silently skipped.
    const paragraphs = mess.match(/<p>([\s\S]*?)<\/p>/g);
    if (!paragraphs) {
        return notFound;
    }
    // Array#toString joins the matches with commas before the tags are removed.
    return paragraphs.toString().replace(/<\/?p>/g, '');
};

/** toJSON output for these schemas applies getters and leaves virtuals out */
[ScrapperSchemas, SourcesSchema, RequestSchemas].forEach((schema) => {
    schema.set('toJSON', {getters: true, virtuals: false});
});

// Compile one model per schema.
const Scrapper = mongoose.model('Scrapper', ScrapperSchemas);
const Parseur = mongoose.model('Parseur', ParsingSchemas);
const Request = mongoose.model('Request', RequestSchemas);
const Source = mongoose.model('Source', SourcesSchema);

// The Scrapper model is the module itself; the other models hang off it.
module.exports = Scrapper;
Object.assign(module.exports, {Parseur, Request, Source});