| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353 | const _ = require('lodash')const stream = require('stream')const Promise = require('bluebird')const pipeline = Promise.promisify(stream.pipeline)/* global WIKI */module.exports = {  async activate() {    // not used  },  async deactivate() {    // not used  },  /**   * INIT   */  async init() {    WIKI.logger.info(`(SEARCH/ELASTICSEARCH) Initializing...`)    switch (this.config.apiVersion) {      case '7.x':        const { Client: Client7 } = require('elasticsearch7')        this.client = new Client7({          nodes: this.config.hosts.split(',').map(_.trim),          sniffOnStart: this.config.sniffOnStart,          sniffInterval: (this.config.sniffInterval > 0) ? this.config.sniffInterval : false,          name: 'wiki-js'        })        break      case '6.x':        const { Client: Client6 } = require('elasticsearch6')        this.client = new Client6({          nodes: this.config.hosts.split(',').map(_.trim),          sniffOnStart: this.config.sniffOnStart,          sniffInterval: (this.config.sniffInterval > 0) ? this.config.sniffInterval : false,          name: 'wiki-js'        })        break      default:        throw new Error('Unsupported version of elasticsearch! Update your settings in the Administration Area.')    }    // -> Create Search Index    await this.createIndex()    WIKI.logger.info(`(SEARCH/ELASTICSEARCH) Initialization completed.`)  },  /**   * Create Index   */  async createIndex() {    try {      const indexExists = await this.client.indices.exists({ index: this.config.indexName })      if (!indexExists.body) {        WIKI.logger.info(`(SEARCH/ELASTICSEARCH) Creating index...`)        try {          const idxBody = {            properties: {              suggest: { type: 'completion' },              title: { type: 'text', boost: 10.0 },              description: { type: 'text', boost: 3.0 },              content: { type: 'text', boost: 1.0 },              locale: { type: 'keyword' },              path: { type: 'text' },              tags: { type: 'text', boost: 8.0 }            }          }          await this.client.indices.create({            index: this.config.indexName,            body: {              mappings: (this.config.apiVersion === '6.x') ? {                _doc: idxBody              } : idxBody,              settings: {                analysis: {                  analyzer: {                    default: {                      type: this.config.analyzer                    }                  }                }              }            }          })        } catch (err) {          WIKI.logger.error(`(SEARCH/ELASTICSEARCH) Create Index Error: `, _.get(err, 'meta.body.error', err))        }      }    } catch (err) {      WIKI.logger.error(`(SEARCH/ELASTICSEARCH) Index Check Error: `, _.get(err, 'meta.body.error', err))    }  },  /**   * QUERY   *   * @param {String} q Query   * @param {Object} opts Additional options   */  async query(q, opts) {    try {      const results = await this.client.search({        index: this.config.indexName,        body: {          query: {            simple_query_string: {              query: `*${q}*`,              fields: ['title^20', 'description^3', 'tags^8', 'content^1'],              default_operator: 'and',              analyze_wildcard: true            }          },          from: 0,          size: 50,          _source: ['title', 'description', 'path', 'locale'],          suggest: {            suggestions: {              text: q,              completion: {                field: 'suggest',                size: 5,                skip_duplicates: true,                fuzzy: true              }            }          }        }      })      return {        results: _.get(results, 'body.hits.hits', []).map(r => ({          id: r._id,          locale: r._source.locale,          path: r._source.path,          title: r._source.title,          description: r._source.description        })),        suggestions: _.reject(_.get(results, 'suggest.suggestions', []).map(s => _.get(s, 'options[0].text', false)), s => !s),        totalHits: _.get(results, 'body.hits.total.value', _.get(results, 'body.hits.total', 0))      }    } catch (err) {      WIKI.logger.warn('Search Engine Error: ', _.get(err, 'meta.body.error', err))    }  },  /**   * Build tags field   * @param id   * @returns {Promise<*|*[]>}   */  async buildTags(id) {    const tags = await WIKI.models.pages.query().findById(id).select('*').withGraphJoined('tags')    return (tags.tags && tags.tags.length > 0) ? tags.tags.map(function (tag) {      return tag.title    }) : []  },  /**   * Build suggest field   */  buildSuggest(page) {    return _.reject(_.uniq(_.concat(      page.title.split(' ').map(s => ({        input: s,        weight: 10      })),      page.description.split(' ').map(s => ({        input: s,        weight: 3      })),      page.safeContent.split(' ').map(s => ({        input: s,        weight: 1      }))    )), ['input', ''])  },  /**   * CREATE   *   * @param {Object} page Page to create   */  async created(page) {    await this.client.index({      index: this.config.indexName,      type: '_doc',      id: page.hash,      body: {        suggest: this.buildSuggest(page),        locale: page.localeCode,        path: page.path,        title: page.title,        description: page.description,        content: page.safeContent,        tags: await this.buildTags(page.id)      },      refresh: true    })  },  /**   * UPDATE   *   * @param {Object} page Page to update   */  async updated(page) {    await this.client.index({      index: this.config.indexName,      type: '_doc',      id: page.hash,      body: {        suggest: this.buildSuggest(page),        locale: page.localeCode,        path: page.path,        title: page.title,        description: page.description,        content: page.safeContent,        tags: await this.buildTags(page.id)      },      refresh: true    })  },  /**   * DELETE   *   * @param {Object} page Page to delete   */  async deleted(page) {    await this.client.delete({      index: this.config.indexName,      type: '_doc',      id: page.hash,      refresh: true    })  },  /**   * RENAME   *   * @param {Object} page Page to rename   */  async renamed(page) {    await this.client.delete({      index: this.config.indexName,      type: '_doc',      id: page.hash,      refresh: true    })    await this.client.index({      index: this.config.indexName,      type: '_doc',      id: page.destinationHash,      body: {        suggest: this.buildSuggest(page),        locale: page.destinationLocaleCode,        path: page.destinationPath,        title: page.title,        description: page.description,        content: page.safeContent,        tags: await this.buildTags(page.id)      },      refresh: true    })  },  /**   * REBUILD INDEX   */  async rebuild() {    WIKI.logger.info(`(SEARCH/ELASTICSEARCH) Rebuilding Index...`)    await this.client.indices.delete({ index: this.config.indexName })    await this.createIndex()    const MAX_INDEXING_BYTES = 10 * Math.pow(2, 20) - Buffer.from('[').byteLength - Buffer.from(']').byteLength // 10 MB    const MAX_INDEXING_COUNT = 1000    const COMMA_BYTES = Buffer.from(',').byteLength    let chunks = []    let bytes = 0    const processDocument = async (cb, doc) => {      try {        if (doc) {          const docBytes = Buffer.from(JSON.stringify(doc)).byteLength          doc['tags'] = await this.buildTags(doc.realId)          // -> Current batch exceeds size limit, flush          if (docBytes + COMMA_BYTES + bytes >= MAX_INDEXING_BYTES) {            await flushBuffer()          }          if (chunks.length > 0) {            bytes += COMMA_BYTES          }          bytes += docBytes          chunks.push(doc)          // -> Current batch exceeds count limit, flush          if (chunks.length >= MAX_INDEXING_COUNT) {            await flushBuffer()          }        } else {          // -> End of stream, flush          await flushBuffer()        }        cb()      } catch (err) {        cb(err)      }    }    const flushBuffer = async () => {      WIKI.logger.info(`(SEARCH/ELASTICSEARCH) Sending batch of ${chunks.length}...`)      try {        await this.client.bulk({          index: this.config.indexName,          body: _.reduce(chunks, (result, doc) => {            result.push({              index: {                _index: this.config.indexName,                _type: '_doc',                _id: doc.id              }            })            doc.safeContent = WIKI.models.pages.cleanHTML(doc.render)            result.push({              suggest: this.buildSuggest(doc),              tags: doc.tags,              locale: doc.locale,              path: doc.path,              title: doc.title,              description: doc.description,              content: doc.safeContent            })            return result          }, []),          refresh: true        })      } catch (err) {        WIKI.logger.warn('(SEARCH/ELASTICSEARCH) Failed to send batch to elasticsearch: ', err)      }      chunks.length = 0      bytes = 0    }    // Added real id in order to fetch page tags from the query    await pipeline(      WIKI.models.knex.column({ id: 'hash' }, 'path', { locale: 'localeCode' }, 'title', 'description', 'render', { realId: 'id' }).select().from('pages').where({        isPublished: true,        isPrivate: false      }).stream(),      new stream.Transform({        objectMode: true,        transform: async (chunk, enc, cb) => processDocument(cb, chunk),        flush: async (cb) => processDocument(cb)      })    )    WIKI.logger.info(`(SEARCH/ELASTICSEARCH) Index rebuilt successfully.`)  }}
 |