HEX
Server: nginx/1.27.0
System: Linux 20d173156d2c 6.8.0-88-generic #89-Ubuntu SMP PREEMPT_DYNAMIC Sat Oct 11 01:02:46 UTC 2025 x86_64
User: www-data (33)
PHP: 8.1.29
Disabled: NONE
Upload Files
File: /var/www/html/wp-content/plugins/content-egg/application/libs/KeywordDensity.php
<?php

namespace ContentEgg\application\libs;

defined('\ABSPATH') || exit;

use ContentEgg\application\libs\stopwords\StopWords;

//use ContentEgg\application\libs\stemmer\Stemmer;

/**
 * KeywordDensity class file
 *
 * @author keywordrush.com <support@keywordrush.com>
 * @link https://www.keywordrush.com
 * @copyright Copyright &copy; 2025 keywordrush.com
 *
 */
class KeywordDensity
{

	private $stemmer_normalisation = false;
	private $lang = 'en';   //en|ru|fr|de|...
	private $text = '';
	private $words = array();
	private $stemmer = null; // stemmer instance
	private $stop_words = null;
	private $words_rank = null;

	public function __construct($lang = 'en')
	{
		$this->lang = $lang;
	}

	public function getStemmer()
	{
		if ($this->stemmer == null)
		{
			require_once dirname(__FILE__) . DIRECTORY_SEPARATOR . 'stemmer' . DIRECTORY_SEPARATOR . 'Stemmer.php';
			if (Stemmer::isLangAvailable($this->lang))
			{
				$this->stemmer = new Stemmer($this->lang);
			}
			else
			{
				$this->stemmer = false;
			}
		}

		return $this->stemmer;
	}

	public function SetStemmer($stemmer)
	{
		$this->stemmer = $stemmer;
	}

	public function getStopWords()
	{
		if ($this->stop_words == null)
		{
			require_once dirname(__FILE__) . DIRECTORY_SEPARATOR . 'stopwords' . DIRECTORY_SEPARATOR . 'StopWords.php';
			if (StopWords::isLangAvailable($this->lang))
			{
				$sw               = new StopWords($this->lang);
				$this->stop_words = $sw->words($this->lang);
			}
			else
			{
				$this->stop_words = array();
			}
		}

		return $this->stop_words;
	}

	public function setText($text)
	{
		$this->text  = strip_tags($text);
		$this->words = null;
	}

	public function setStemmerNormalisatiom($value)
	{
		$this->stemmer_normalisation = (bool) $value;
	}

	public function getPopularWords($max = null)
	{
		$this->splitWords();
		$this->words_rank = array_count_values($this->words);
		arsort($this->words_rank);
		if ($max)
		{
			return array_keys(array_slice($this->words_rank, 0, $max));
		}
		else
		{
			return array_keys($this->words_rank);
		}
	}

	private function splitWords()
	{
		$this->words = array();
		preg_match_all("/\pL+/ui", $this->text, $m);
		foreach ($m[0] as $word)
		{
			$word = $this->prepareWord($word);
			if (!$word)
			{
				continue;
			}

			$this->words[] = $word;
		}
	}

	public function prepareWord($word)
	{
		$word = mb_strtolower($word, 'UTF-8');

		if (in_array($word, $this->getStopWords()))
		{
			return false;
		}

		if (!ctype_digit($word) && mb_strlen($word, 'UTF-8') <= 1)
		{
			return false;
		}

		if ($this->stemmer_normalisation)
		{
			$stemmer = $this->getStemmer();
			if ($stemmer)
			{
				$word = $stemmer->stem($word);
			}
		}

		return $word;
	}
}