1. Install nsfwjs and its dependencies
npm install express --save
npm install multer --save
npm install jpeg-js --save
npm install @tensorflow/tfjs-node --save
npm install nsfwjs --save
Note: Python is required to install @tensorflow/tfjs-node, and it is recommended to add it to the user's Path environment variable.
2. Run the WebAPI service
The nsfwjs author provides a simple WebAPI service; it is copied here for convenience:
const express = require('express')
const multer = require('multer')
const jpeg = require('jpeg-js')
const tf = require('@tensorflow/tfjs-node')
const nsfw = require('nsfwjs')

const app = express()
const upload = multer()

let _model

const convert = async (img) => {
  // Decoded image in UInt8 Byte array
  const image = await jpeg.decode(img, true)

  const numChannels = 3
  const numPixels = image.width * image.height
  const values = new Int32Array(numPixels * numChannels)

  for (let i = 0; i < numPixels; i++)
    for (let c = 0; c < numChannels; ++c)
      values[i * numChannels + c] = image.data[i * 4 + c]

  return tf.tensor3d(values, [image.height, image.width, numChannels], 'int32')
}

app.post('/nsfw', upload.single('image'), async (req, res) => {
  if (!req.file) res.status(400).send('Missing image multipart/form-data')
  else {
    const image = await convert(req.file.buffer)
    const predictions = await _model.classify(image)
    image.dispose()
    res.json(predictions)
  }
})

const load_model = async () => {
  _model = await nsfw.load() // you can specify the model here
}

// Keep the model in memory, make sure it's loaded only once
load_model().then(() => app.listen(8080))
Try running this service (note that this app only supports pictures in jpeg format). Assuming the code above is saved as app.js:
node app.js
Test with curl
curl --request POST localhost:8080/nsfw --header 'Content-Type: multipart/form-data' --data-binary 'image=@'
If I want something simpler, I can write it like this:
curl -F "image=@" "http://localhost:8080/nsfw"
You can test it through Postman under Windows.
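For reference, a successful call returns the model's five category probabilities as a JSON array, along these lines (the category names are what nsfwjs reports; the numbers here are made up for illustration):

[
  { "className": "Neutral", "probability": 0.93 },
  { "className": "Drawing", "probability": 0.05 },
  { "className": "Sexy", "probability": 0.01 },
  { "className": "Porn", "probability": 0.007 },
  { "className": "Hentai", "probability": 0.003 }
]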
3. Encapsulating the call in .NET
Once the nsfwjs WebAPI service is running, it is very easy to wrap the calls in .NET:
3.1 First start node through Process; the console window can be hidden via output redirection.
3.2 Submit the images to be identified through a client component such as HttpClient or RestSharp and read back the results (see the C# sketch after this list).
3.3 If you want to analyze videos, you can also refer to this article: FFMPEG obtains video keyframes and saves them as jpg images (ps: reproduced at the end of this article). Take the screenshots either by invoking the ffmpeg command line or by calling its API from code.
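Steps 3.1 and 3.2 might look like the following minimal C# sketch. The script name app.js, the fixed startup delay, and the helper names are my assumptions for illustration, not part of the original service:

// Minimal sketch of steps 3.1/3.2. Assumes the service code above is saved
// as app.js and listens on port 8080, as in the sample.
using System;
using System.Diagnostics;
using System.IO;
using System.Net.Http;
using System.Threading.Tasks;

class NsfwClient
{
    // 3.1 Start node with a hidden console by redirecting its output.
    static Process StartService()
    {
        var psi = new ProcessStartInfo
        {
            FileName = "node",
            Arguments = "app.js", // assumed file name of the service script
            UseShellExecute = false,
            CreateNoWindow = true,
            RedirectStandardOutput = true,
            RedirectStandardError = true
        };
        return Process.Start(psi);
    }

    // 3.2 Post the image as multipart/form-data and return the raw JSON result.
    static async Task<string> ClassifyAsync(HttpClient http, string imagePath)
    {
        using (var form = new MultipartFormDataContent())
        {
            var bytes = File.ReadAllBytes(imagePath);
            form.Add(new ByteArrayContent(bytes), "image", Path.GetFileName(imagePath));
            var response = await http.PostAsync("http://localhost:8080/nsfw", form);
            response.EnsureSuccessStatusCode();
            return await response.Content.ReadAsStringAsync();
        }
    }

    static async Task Main()
    {
        using (var node = StartService())
        using (var http = new HttpClient())
        {
            await Task.Delay(3000); // crude wait for the model to load; poll in real code
            Console.WriteLine(await ClassifyAsync(http, "test.jpg"));
            node.Kill();
        }
    }
}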
It works quite well in practice: pictures under 200K generally return identification results within 200 ms.
ps: Now let's look at how FFMPEG obtains video keyframes and saves them as jpg images.
1. Command line method
Grab one frame per second (-r sets the rate):
ffmpeg -i input.mp4 -f image2 -r 1 dstPath/image-%03d.jpg
Extract I-frames:
ffmpeg -i input.mp4 -an -vf select='eq(pict_type\,I)' -vsync 2 -s 720x480 -f image2 dstPath/image-%03d.jpg
2. Code method
Extract I-frames:
// source:
#include <iostream>
#include <cstdio>
#include <cstring>
#define __STDC_CONSTANT_MACROS
extern "C"
{
#include <libavutil/avutil.h>
#include <libavutil/imgutils.h>
#include <libavutil/samplefmt.h>
#include <libavutil/timestamp.h>
#include <libavcodec/avcodec.h>
#include <libavutil/channel_layout.h>
#include <libavutil/opt.h>
#include <libavutil/mathematics.h>
#include <libavutil/frame.h>
#include <libavutil/mem.h>
#include <libavutil/pixdesc.h>
#include <libavformat/avformat.h>
#include <libswscale/swscale.h>
#include <jpeglib.h>
}
using namespace std;

char errbuf[256];
char timebuf[256];

static AVFormatContext *fmt_ctx = NULL;
static AVCodecContext *video_dec_ctx = NULL;
static int width, height;
static enum AVPixelFormat pix_fmt;
static AVStream *video_stream = NULL;
static const char *src_filename = NULL;
static const char *output_dir = NULL;

static int video_stream_idx = -1;
static AVFrame *frame = NULL;
static AVFrame *pFrameRGB = NULL;
static AVPacket pkt;
static struct SwsContext *pSWSCtx = NULL;
static int video_frame_count = 0;

/* Enable or disable frame reference counting. You are not supposed to support
 * both paths in your application but pick the one most appropriate to your
 * needs. Look for the use of refcount in this example to see what are the
 * differences of API usage between them. */
static int refcount = 0;

static void jpg_save(uint8_t *pRGBBuffer, int iFrame, int width, int height);

static int decode_packet(int *got_frame, int cached)
{
    int ret = 0;
    int decoded = pkt.size;

    *got_frame = 0;

    if (pkt.stream_index == video_stream_idx)
    {
        /* decode video frame */
        ret = avcodec_decode_video2(video_dec_ctx, frame, got_frame, &pkt);
        if (ret < 0)
        {
            fprintf(stderr, "Error decoding video frame (%s)\n",
                    av_make_error_string(errbuf, sizeof(errbuf), ret));
            return ret;
        }

        if (*got_frame)
        {
            if (frame->width != width || frame->height != height ||
                frame->format != pix_fmt)
            {
                /* To handle this change, one could call av_image_alloc again and
                 * decode the following frames into another rawvideo file. */
                fprintf(stderr, "Error: Width, height and pixel format have to be "
                                "constant in a rawvideo file, but the width, height or "
                                "pixel format of the input video changed:\n"
                                "old: width = %d, height = %d, format = %s\n"
                                "new: width = %d, height = %d, format = %s\n",
                        width, height, av_get_pix_fmt_name(pix_fmt),
                        frame->width, frame->height,
                        av_get_pix_fmt_name((enum AVPixelFormat)frame->format));
                return -1;
            }

            video_frame_count++;
            static int iFrame = 0;
            if (frame->key_frame == 1) // if it is a keyframe
            {
                sws_scale(pSWSCtx, frame->data, frame->linesize, 0,
                          video_dec_ctx->height, pFrameRGB->data, pFrameRGB->linesize);
                // save to disk
                iFrame++;
                jpg_save(pFrameRGB->data[0], iFrame, width, height);
            }
        }
    }

    /* If we use frame reference counting, we own the data and need
     * to de-reference it when we don't use it anymore */
    if (*got_frame && refcount)
        av_frame_unref(frame);

    return decoded;
}

static int open_codec_context(int *stream_idx, AVCodecContext **dec_ctx,
                              AVFormatContext *fmt_ctx, enum AVMediaType type)
{
    int ret, stream_index;
    AVStream *st;
    AVCodec *dec = NULL;
    AVDictionary *opts = NULL;

    ret = av_find_best_stream(fmt_ctx, type, -1, -1, NULL, 0);
    if (ret < 0)
    {
        fprintf(stderr, "Could not find %s stream in input file '%s'\n",
                av_get_media_type_string(type), src_filename);
        return ret;
    }
    else
    {
        stream_index = ret;
        st = fmt_ctx->streams[stream_index];

        /* find decoder for the stream */
        dec = avcodec_find_decoder(st->codecpar->codec_id);
        if (!dec)
        {
            fprintf(stderr, "Failed to find %s codec\n",
                    av_get_media_type_string(type));
            return AVERROR(EINVAL);
        }

        /* Allocate a codec context for the decoder */
        *dec_ctx = avcodec_alloc_context3(dec);
        if (!*dec_ctx)
        {
            fprintf(stderr, "Failed to allocate the %s codec context\n",
                    av_get_media_type_string(type));
            return AVERROR(ENOMEM);
        }

        /* Copy codec parameters from input stream to output codec context */
        if ((ret = avcodec_parameters_to_context(*dec_ctx, st->codecpar)) < 0)
        {
            fprintf(stderr, "Failed to copy %s codec parameters to decoder context\n",
                    av_get_media_type_string(type));
            return ret;
        }

        /* Init the decoders, with or without reference counting */
        av_dict_set(&opts, "refcounted_frames", refcount ? "1" : "0", 0);
        if ((ret = avcodec_open2(*dec_ctx, dec, &opts)) < 0)
        {
            fprintf(stderr, "Failed to open %s codec\n",
                    av_get_media_type_string(type));
            return ret;
        }
        *stream_idx = stream_index;
    }
    return 0;
}

static int get_format_from_sample_fmt(const char **fmt,
                                      enum AVSampleFormat sample_fmt)
{
    int i;
    struct sample_fmt_entry
    {
        enum AVSampleFormat sample_fmt;
        const char *fmt_be, *fmt_le;
    } sample_fmt_entries[] = {
        {AV_SAMPLE_FMT_U8, "u8", "u8"},
        {AV_SAMPLE_FMT_S16, "s16be", "s16le"},
        {AV_SAMPLE_FMT_S32, "s32be", "s32le"},
        {AV_SAMPLE_FMT_FLT, "f32be", "f32le"},
        {AV_SAMPLE_FMT_DBL, "f64be", "f64le"},
    };
    *fmt = NULL;

    for (i = 0; i < FF_ARRAY_ELEMS(sample_fmt_entries); i++)
    {
        struct sample_fmt_entry *entry = &sample_fmt_entries[i];
        if (sample_fmt == entry->sample_fmt)
        {
            *fmt = AV_NE(entry->fmt_be, entry->fmt_le);
            return 0;
        }
    }

    fprintf(stderr, "sample format %s is not supported as output format\n",
            av_get_sample_fmt_name(sample_fmt));
    return -1;
}

int main(int argc, char **argv)
{
    int ret = 0, got_frame;
    int numBytes = 0;
    uint8_t *buffer = NULL;

    if (argc != 3 && argc != 4)
    {
        fprintf(stderr, "usage: %s [-refcount] input_file output_dir\n"
                        "API example program to show how to read frames from an input file.\n"
                        "This program reads frames from a file, decodes them, and writes jpg keyframes\n"
                        "If the -refcount option is specified, the program use the\n"
                        "reference counting frame system which allows keeping a copy of\n"
                        "the data for longer than one decode call.\n"
                        "\n",
                argv[0]);
        exit(1);
    }
    if (argc == 4 && !strcmp(argv[1], "-refcount"))
    {
        refcount = 1;
        argv++;
    }
    src_filename = argv[1];
    output_dir = argv[2];

    /* open input file, and allocate format context */
    if (avformat_open_input(&fmt_ctx, src_filename, NULL, NULL) < 0)
    {
        fprintf(stderr, "Could not open source file %s\n", src_filename);
        exit(1);
    }

    /* retrieve stream information */
    if (avformat_find_stream_info(fmt_ctx, NULL) < 0)
    {
        fprintf(stderr, "Could not find stream information\n");
        exit(1);
    }

    if (open_codec_context(&video_stream_idx, &video_dec_ctx, fmt_ctx,
                           AVMEDIA_TYPE_VIDEO) >= 0)
    {
        video_stream = fmt_ctx->streams[video_stream_idx];

        /* allocate image where the decoded image will be put */
        width = video_dec_ctx->width;
        height = video_dec_ctx->height;
        pix_fmt = video_dec_ctx->pix_fmt;
    }
    else
    {
        goto end;
    }

    /* dump input information to stderr */
    av_dump_format(fmt_ctx, 0, src_filename, 0);

    if (!video_stream)
    {
        fprintf(stderr, "Could not find video stream in the input, aborting\n");
        ret = 1;
        goto end;
    }

    pFrameRGB = av_frame_alloc();
    numBytes = avpicture_get_size(AV_PIX_FMT_BGR24, width, height);
    buffer = (uint8_t *)av_malloc(numBytes);
    avpicture_fill((AVPicture *)pFrameRGB, buffer, AV_PIX_FMT_BGR24, width, height);
    pSWSCtx = sws_getContext(width, height, pix_fmt, width, height,
                             AV_PIX_FMT_RGB24, SWS_BICUBIC, NULL, NULL, NULL);

    frame = av_frame_alloc();
    if (!frame)
    {
        fprintf(stderr, "Could not allocate frame\n");
        ret = AVERROR(ENOMEM);
        goto end;
    }

    /* initialize packet, set data to NULL, let the demuxer fill it */
    av_init_packet(&pkt);
    pkt.data = NULL;
    pkt.size = 0;

    if (video_stream)
        printf("Demuxing video from file '%s' to dir: %s\n", src_filename, output_dir);

    /* read frames from the file */
    while (av_read_frame(fmt_ctx, &pkt) >= 0)
    {
        AVPacket orig_pkt = pkt;
        do
        {
            ret = decode_packet(&got_frame, 0);
            if (ret < 0)
                break;
            pkt.data += ret;
            pkt.size -= ret;
        } while (pkt.size > 0);
        av_packet_unref(&orig_pkt);
    }

    /* flush cached frames */
    pkt.data = NULL;
    pkt.size = 0;
    do
    {
        decode_packet(&got_frame, 1);
    } while (got_frame);

end:
    if (video_dec_ctx)
        avcodec_free_context(&video_dec_ctx);
    if (fmt_ctx)
        avformat_close_input(&fmt_ctx);
    if (buffer)
        av_free(buffer);
    if (pFrameRGB)
        av_frame_free(&pFrameRGB);
    if (frame)
        av_frame_free(&frame);
    return ret < 0;
}

static void jpg_save(uint8_t *pRGBBuffer, int iFrame, int width, int height)
{
    struct jpeg_compress_struct cinfo;
    struct jpeg_error_mgr jerr;
    char szFilename[1024];
    int row_stride;
    FILE *fp;
    JSAMPROW row_pointer[1]; // one line of the bitmap

    cinfo.err = jpeg_std_error(&jerr);
    jpeg_create_compress(&cinfo);

    sprintf(szFilename, "%s/image-%03d.jpg", output_dir, iFrame); // picture name: prefix plus frame number
    fp = fopen(szFilename, "wb");
    if (fp == NULL)
        return;
    jpeg_stdio_dest(&cinfo, fp);

    cinfo.image_width = width; // width and height of the image, in pixels
    cinfo.image_height = height;
    cinfo.input_components = 3;     // 1 means a grayscale image; for a color bitmap it is 3
    cinfo.in_color_space = JCS_RGB; // JCS_GRAYSCALE for a grayscale image, JCS_RGB for color

    jpeg_set_defaults(&cinfo);
    jpeg_set_quality(&cinfo, 80, 1);

    jpeg_start_compress(&cinfo, TRUE);
    row_stride = cinfo.image_width * 3; // bytes per row; multiply by 3 unless it is an indexed image

    // compress line by line
    while (cinfo.next_scanline < cinfo.image_height)
    {
        row_pointer[0] = &(pRGBBuffer[cinfo.next_scanline * row_stride]);
        jpeg_write_scanlines(&cinfo, row_pointer, 1);
    }

    jpeg_finish_compress(&cinfo);
    jpeg_destroy_compress(&cinfo);
    fclose(fp);
}

$ cat Makefile
# assumes the source above is saved as keyframe.cpp
keyframe: keyframe.cpp
	g++ $< -o $@ `pkg-config --libs libavcodec libavformat libswscale libavutil` -ljpeg -fpermissive
That's all for this article on .NET video identification by calling nsfwjs through a WebAPI. For more related .NET WebAPI video identification content, please search my previous articles or continue browsing the related articles below. I hope you will continue to support me!