Blame view

src/main.cpp 7.48 KB
aac5773f   hucm   功能基本完成,接口待打磨
1
2
3
  #include "FFNvDecoderManager.h"
  #include <iostream>
  
e41a52bb   Hu Chunming   1.优化数据读取线程;2. 添加A...
4
5
6
7
  #include "cuda_kernels.h"
  
  #include "NvJpegEncoder.h"
  
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
8
9
10
11
12
  #include <pthread.h>
  #include <thread>
  
  #include <chrono>
  
e41a52bb   Hu Chunming   1.优化数据读取线程;2. 添加A...
13
14
  unsigned char *pHwRgb = nullptr;
  
0b43216c   Hu Chunming   添加重要注释
15
16
17
  /**
   * 注意: gpuFrame 在解码器设置的显卡上,后续操作要十分注意这一点,尤其是多线程情况
   * */
aac5773f   hucm   功能基本完成,接口待打磨
18
19
20
21
  void postDecoded(const void * userPtr, AVFrame * gpuFrame){
      FFNvDecoder* decoder = (FFNvDecoder*)userPtr;
      if (decoder!= nullptr)
      {
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
22
23
24
25
26
27
28
          // cout << "decode name: " << decoder->getName() << endl;
  
          if (decoder->getName() == "dec1")
          {
              /* code */
          }
          
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
29
30
          // const char* gpu_pixfmt = av_get_pix_fmt_name((AVPixelFormat)gpuFrame->format);
          // cout << "pixfmt: " << gpu_pixfmt << endl;
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
31
          // cout << "keyframe: " << gpuFrame->key_frame << " width: " << gpuFrame->width << " height: "<< gpuFrame->height << endl;
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
32
          // cout << "decode successed ✿✿ヽ(°▽°)ノ✿ " << endl;
e41a52bb   Hu Chunming   1.优化数据读取线程;2. 添加A...
33
34
  
          if (gpuFrame->format == AV_PIX_FMT_CUDA)
7319ea36   Hu Chunming   多显卡设置
35
          {   
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
36
              // cout << "gpuid = " << atoi(decoder->m_cfg.gpuid.c_str()) << endl;
7319ea36   Hu Chunming   多显卡设置
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
              // cudaSetDevice(atoi(decoder->m_cfg.gpuid.c_str()));
              // cudaError_t cudaStatus;
              // if(pHwRgb == nullptr){
              //     cuda_common::setColorSpace2( ITU709, 0 );
              //     cudaStatus = cudaMalloc((void **)&pHwRgb, 3 * gpuFrame->width * gpuFrame->height * sizeof(unsigned char));
              // }
              // cudaStatus = cuda_common::CUDAToBGR((CUdeviceptr)gpuFrame->data[0],(CUdeviceptr)gpuFrame->data[1], gpuFrame->linesize[0], gpuFrame->linesize[1], pHwRgb, gpuFrame->width, gpuFrame->height);
              // cudaDeviceSynchronize();
              // if (cudaStatus != cudaSuccess) {
              //     cout << "CUDAToBGR failed !!!" << endl;
              //     return;
              // }
  
              // string path = "/home/cmhu/FFNvDecoder/" + decoder->m_cfg.gpuid + ".jpg";
              // saveJpeg(path.c_str(), pHwRgb, gpuFrame->width, gpuFrame->height);  // 验证 CUDAToRGB 
e41a52bb   Hu Chunming   1.优化数据读取线程;2. 添加A...
52
          }
aac5773f   hucm   功能基本完成,接口待打磨
53
54
55
      }
  }
  
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
  long start_time = 0;
  long end_time = 0;
  bool count_flag = false;
  int count = 0;
  int count_std = 100;
  
  long long get_cur_time(){
      // 获取操作系统当前时间点(精确到微秒)
      chrono::time_point<chrono::system_clock, chrono::microseconds> tpMicro
          = chrono::time_point_cast<chrono::microseconds>(chrono::system_clock::now());
      // (微秒精度的)时间点 => (微秒精度的)时间戳
      time_t totalMicroSeconds = tpMicro.time_since_epoch().count();
  
  	long long currentTime = ((long long)totalMicroSeconds)/1000;
  
      return currentTime;
  }
  
  int sum = 0;
  void postDecoded0(const void * userPtr, AVFrame * gpuFrame){
      FFNvDecoder* decoder = (FFNvDecoder*)userPtr;
      if (decoder!= nullptr)
      {
          // cout << "decode name: " << decoder->getName() << endl;
          if (decoder->getName() == "dec")
          {
              if (! count_flag)
              {
                  count_flag = true;
                  count = 0;
                  end_time = start_time = get_cur_time();
              }
              count++;
              sum ++ ;
              if (count >= count_std)
              {
                  end_time = get_cur_time();
                  long time_using = end_time - start_time;
                  double time_per_frame = double(time_using)/count_std ;
                  cout << count_std << "帧用时:" << time_using << "ms 每帧用时:" << time_per_frame << "ms" << endl;
                  cout << "keyframe: " << gpuFrame->key_frame << " width: " << gpuFrame->width << " height: "<< gpuFrame->height << endl;
                  cout << gpuFrame->pts << endl;
  
                  count_flag = false;
              }
          }
      }
  }
  
  // string test_uri = "rtmp://192.168.10.56:1935/objecteye/1";
  string test_uri = "/home/cmhu/data/test.mp4";
  
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
108
  void createDecode(int index){
aac5773f   hucm   功能基本完成,接口待打磨
109
      FFNvDecoderManager* pDecManager = FFNvDecoderManager::getInstance();
7319ea36   Hu Chunming   多显卡设置
110
      MgrDecConfig config;
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
111
      config.name = "dec" + to_string(index);
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
112
      config.cfg.uri = test_uri;
7319ea36   Hu Chunming   多显卡设置
113
114
      config.cfg.post_decoded_cbk = postDecoded;
      config.cfg.force_tcp = true;
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
115
116
117
118
119
120
121
122
123
124
  
      if (index % 2 == 0)
      {
          config.cfg.gpuid = "2";
      }
      else
      {
          config.cfg.gpuid = "1";
      }
      
7319ea36   Hu Chunming   多显卡设置
125
126
127
      FFNvDecoder* decoder = pDecManager->createDecoder(config);
      if (!decoder)
      {
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
128
          return ;
7319ea36   Hu Chunming   多显卡设置
129
130
131
      }
      pDecManager->setUserPtr(config.name, decoder);
      pDecManager->startDecodeByName(config.name);
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
132
133
  }
  
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
  #define checkCudaErrors(S) do {CUresult  status; \
          status = S; \
          if (status != CUDA_SUCCESS ) std::cout << __LINE__ <<" checkCudaErrors - status = " << status << std::endl; \
          } while (false)
  
  int CheckCUDAProperty( int devId )
  {
      cuInit(0);
  
  	CUdevice dev = devId;
  	size_t memSize = 0;
  	char devName[256] = {0};
  	int major = 0, minor = 0;
  	CUresult rlt = CUDA_SUCCESS;
  
  	rlt = cuDeviceComputeCapability( &major, &minor, dev );
  	checkCudaErrors( rlt );
  
  	rlt = cuDeviceGetName( devName, sizeof( devName ), dev );
  	checkCudaErrors( rlt );
  
  	printf( "Using GPU Device %d: %s has SM %d.%d compute capability\n",
  		    dev, devName, major, minor );
  
  	rlt = cuDeviceTotalMem( &memSize, dev );
  	checkCudaErrors( rlt );
  
  	printf( "Total amount of global memory:   %4.4f MB\n",
  		   (float)memSize / ( 1024 * 1024 ) );
  
  	return 0;
  }
  
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
167
168
  int main(){
  
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
169
170
      CheckCUDAProperty(1);
  
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
171
      FFNvDecoderManager* pDecManager = FFNvDecoderManager::getInstance();
7319ea36   Hu Chunming   多显卡设置
172
  
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
173
174
175
176
177
      int count = 105;
      for (size_t i = 0; i < count ; i++)
      {
          createDecode(i);
      }
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
178
179
  
      MgrDecConfig config;
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
180
181
182
      config.name = "dec";
      config.cfg.uri = test_uri;
      config.cfg.post_decoded_cbk = postDecoded0;
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
183
      config.cfg.force_tcp = true;
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
184
      config.cfg.gpuid = "1";
7319ea36   Hu Chunming   多显卡设置
185
      FFNvDecoder* dec2 = pDecManager->createDecoder(config);
aac5773f   hucm   功能基本完成,接口待打磨
186
187
188
189
      if (!dec2)
      {
          return 1;
      }
7319ea36   Hu Chunming   多显卡设置
190
191
192
      pDecManager->setUserPtr(config.name, dec2);
      pDecManager->startDecodeByName(config.name);
  
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
      pthread_t m_decode_thread;
      pthread_create(&m_decode_thread,0,
          [](void* arg)
          {
              while (true)
              {
                  std::this_thread::sleep_for(std::chrono::milliseconds(5000));
                  FFNvDecoderManager* pDecManager = FFNvDecoderManager::getInstance();
                  int count = pDecManager->count();
                  cout << "当前运行路数: " << pDecManager->count() << endl;
                  if (count <= 0)
                  {
                      break;
                  }
              }  
  
              return (void*)0;
          }
      ,nullptr);
  
7319ea36   Hu Chunming   多显卡设置
213
      
48330793   Hu Chunming   修正解码线程自然结束时解码器内存没...
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
      // config.name = "dec0";
      // config.cfg.uri = "rtmp://192.168.10.56:1935/objecteye/1";
      // config.cfg.gpuid = "0";
      // FFNvDecoder* dec0 = pDecManager->createDecoder(config);
      // if (!dec0)
      // {
      //     return 1;
      // }
      // pDecManager->setUserPtr(config.name, dec0);
      // pDecManager->startDecodeByName(config.name);
  
      // config.name = "dec01";
      // config.cfg.uri = "rtmp://192.168.10.56:1935/objecteye/1";
      // config.cfg.gpuid = "0";
      // FFNvDecoder* dec01 = pDecManager->createDecoder(config);
      // if (!dec01)
      // {
      //     return 1;
      // }
      // pDecManager->setUserPtr(config.name, dec01);
      // pDecManager->startDecodeByName(config.name);
aac5773f   hucm   功能基本完成,接口待打磨
235
  
e41a52bb   Hu Chunming   1.优化数据读取线程;2. 添加A...
236
      // while (getchar() != 'q');  
aac5773f   hucm   功能基本完成,接口待打磨
237
  
e41a52bb   Hu Chunming   1.优化数据读取线程;2. 添加A...
238
239
240
      // // pDecManager->closeDecoderByName("dec1");
      // // pDecManager->pauseDecoder("dec1");
      // pDecManager->pauseDecoder("dec2");
aac5773f   hucm   功能基本完成,接口待打磨
241
  
e41a52bb   Hu Chunming   1.优化数据读取线程;2. 添加A...
242
      // while (getchar() != 'q');
aac5773f   hucm   功能基本完成,接口待打磨
243
  
e41a52bb   Hu Chunming   1.优化数据读取线程;2. 添加A...
244
245
      // // pDecManager->resumeDecoder("dec1");
      // pDecManager->resumeDecoder("dec2");
aac5773f   hucm   功能基本完成,接口待打磨
246
  
f40cc409   Hu Chunming   优化显存占用。当前在3080显卡上...
247
248
      cout << "总共帧数:" << sum << endl;
  
aac5773f   hucm   功能基本完成,接口待打磨
249
250
251
252
      while (getchar() != 'q');
  
      pDecManager->closeAllDecoder();
  }