forked from mirror/pixelfed
64 lines
1.6 KiB
PHP
64 lines
1.6 KiB
PHP
<?php
|
|
|
|
namespace App\Jobs\AutospamPipeline;
|
|
|
|
use Illuminate\Bus\Queueable;
|
|
use Illuminate\Contracts\Queue\ShouldBeUnique;
|
|
use Illuminate\Contracts\Queue\ShouldQueue;
|
|
use Illuminate\Foundation\Bus\Dispatchable;
|
|
use Illuminate\Queue\InteractsWithQueue;
|
|
use Illuminate\Queue\SerializesModels;
|
|
use App\Util\Lexer\Classifier;
|
|
use App\AccountInterstitial;
|
|
use App\Status;
|
|
use Illuminate\Support\Facades\Storage;
|
|
use App\Services\AutospamService;
|
|
|
|
class AutospamPretrainPipeline implements ShouldQueue
|
|
{
|
|
use Dispatchable, InteractsWithQueue, Queueable, SerializesModels;
|
|
|
|
public $classifier;
|
|
|
|
/**
|
|
* Create a new job instance.
|
|
*/
|
|
public function __construct()
|
|
{
|
|
$this->classifier = new Classifier();
|
|
}
|
|
|
|
/**
|
|
* Execute the job.
|
|
*/
|
|
public function handle(): void
|
|
{
|
|
$classifier = $this->classifier;
|
|
|
|
$aiCount = AccountInterstitial::whereItemType('App\Status')
|
|
->whereIsSpam(true)
|
|
->count();
|
|
|
|
if($aiCount < 100) {
|
|
return;
|
|
}
|
|
|
|
AccountInterstitial::whereItemType('App\Status')
|
|
->whereIsSpam(true)
|
|
->inRandomOrder()
|
|
->take(config('autospam.nlp.spam_sample_limit'))
|
|
->pluck('item_id')
|
|
->each(function ($ai) use($classifier) {
|
|
$status = Status::whereNotNull('caption')->find($ai);
|
|
if(!$status) {
|
|
return;
|
|
}
|
|
$classifier->learn($status->caption, 'spam');
|
|
});
|
|
|
|
Storage::put(AutospamService::MODEL_SPAM_PATH, $classifier->export());
|
|
|
|
AutospamUpdateCachedDataPipeline::dispatch()->delay(5);
|
|
}
|
|
}
|