【代码阅读】darknet源码阅读(二):utils.h 与 utils.c

参考文献依然是放前面:https://blog.csdn.net/caicaiatnbu/category_9096319.html

但我主要是以这个版本的darknet【 https://github.com/AlexeyAB/darknet】,与原始的版本还是有一点区别的。

步入正题,utils主要是进行一些读写操作。

读代码好长。。抽空读,中间有两次突然断电,注释都没保存,后面也懒得补了,我会坚持的!努力学C++

1.utils.h

#ifndef UTILS_H
#define UTILS_H
#include "darknet.h"
#include "list.h"

#include <stdio.h>
#include <time.h>

#ifndef M_PI
#define M_PI       3.14159265358979323846   // pi
#endif

#ifdef __cplusplus
extern "C" {  //这个在list的解析里提到过,要以C的方式链接
#endif

LIB_API void free_ptrs(void **ptrs, int n);
LIB_API void top_k(float *a, int n, int k, int *index);

void *xmalloc(size_t size);
void *xcalloc(size_t nmemb, size_t size);
void *xrealloc(void *ptr, size_t size);


double what_time_is_it_now();//获得当前的时间
int *read_map(char *filename);//
void shuffle(void *arr, size_t n, size_t size);//对数组进行洗牌操作
void sorta_shuffle(void *arr, size_t n, size_t size, size_t sections);
char *basecfg(char *cfgfile);
int alphanum_to_int(char c);
char int_to_alphanum(int i);
int read_int(int fd);
void write_int(int fd, int n);
void read_all(int fd, char *buffer, size_t bytes);
void write_all(int fd, char *buffer, size_t bytes);
int read_all_fail(int fd, char *buffer, size_t bytes);
int write_all_fail(int fd, char *buffer, size_t bytes);
LIB_API void find_replace(const char* str, char* orig, char* rep, char* output);
void replace_image_to_label(const char* input_path, char* output_path);
void error(const char *s);
void malloc_error();
void calloc_error();
void realloc_error();
void file_error(char *s);
void strip(char *s);
void strip_args(char *s);
void strip_char(char *s, char bad);
list *split_str(char *s, char delim);
char *fgetl(FILE *fp);
list *parse_csv_line(char *line);
char *copy_string(char *s);
int count_fields(char *line);
float *parse_fields(char *line, int n);
void normalize_array(float *a, int n);
void scale_array(float *a, int n, float s);
void translate_array(float *a, int n, float s);
int max_index(float *a, int n);
int top_max_index(float *a, int n, int k);
float constrain(float min, float max, float a);
int constrain_int(int a, int min, int max);
float mse_array(float *a, int n);
float rand_normal();
size_t rand_size_t();
float rand_uniform(float min, float max);
float rand_scale(float s);
int rand_int(int min, int max);
float sum_array(float *a, int n);
float mean_array(float *a, int n);
void mean_arrays(float **a, int n, int els, float *avg);
float variance_array(float *a, int n);
float mag_array(float *a, int n);
float mag_array_skip(float *a, int n, int * indices_to_skip);
float dist_array(float *a, float *b, int n, int sub);
float **one_hot_encode(float *a, int n, int k);
float sec(clock_t clocks);
int find_int_arg(int argc, char **argv, char *arg, int def);
float find_float_arg(int argc, char **argv, char *arg, float def);
int find_arg(int argc, char* argv[], char *arg);
char *find_char_arg(int argc, char **argv, char *arg, char *def);
int sample_array(float *a, int n);
int sample_array_custom(float *a, int n);
void print_statistics(float *a, int n);
unsigned int random_gen_fast(void);
float random_float_fast();
int rand_int_fast(int min, int max);
unsigned int random_gen();
float random_float();
float rand_uniform_strong(float min, float max);
float rand_precalc_random(float min, float max, float random_part);
double double_rand(void);
unsigned int uint_rand(unsigned int less_than);
int check_array_is_nan(float *arr, int size);
int check_array_is_inf(float *arr, int size);
int int_index(int *a, int val, int n);
int *random_index_order(int min, int max);
int max_int_index(int *a, int n);
boxabs box_to_boxabs(const box* b, const int img_w, const int img_h, const int bounds_check);
int make_directory(char *path, int mode);

#define max_val_cmp(a,b) (((a) > (b)) ? (a) : (b))
#define min_val_cmp(a,b) (((a) < (b)) ? (a) : (b))

#ifdef __cplusplus
}
#endif

#endif

2.utils.c

#ifndef _GNU_SOURCE
#define _GNU_SOURCE
#endif
#include "utils.h"
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#ifndef _USE_MATH_DEFINES
#define _USE_MATH_DEFINES
#endif
#include <math.h>
#include <assert.h>
#include <float.h>
#include <limits.h>
#include "darkunistd.h"
#ifdef WIN32
#include "gettimeofday.h"
#else
#include <sys/time.h>
#include <sys/stat.h>
#endif


#ifndef USE_CMAKE_LIBS
#pragma warning(disable: 4996)
#endif

//malloc构建size大小的存储空间
void *xmalloc(size_t size) {
    void *ptr=malloc(size);
    if(!ptr) {
        malloc_error();
    }
    return ptr;
}


//calloc构建size大小的存储空间
void *xcalloc(size_t nmemb, size_t size) {
    void *ptr=calloc(nmemb,size);
    if(!ptr) {
        calloc_error();
    }
    return ptr;
}

//realloc扩大存储空间
void *xrealloc(void *ptr, size_t size) {
    ptr=realloc(ptr,size);
    if(!ptr) {
        realloc_error();
    }
    return ptr;
}

// 获得当前时间,到秒的时间戳,并对微秒进行四舍五入。
double what_time_is_it_now()
{
    /*
    struct timeval
    {
        __time_t tv_sec;        /* Seconds. */
        __suseconds_t tv_usec;  /* Microseconds. */
     };
    tv_sec为Epoch到创建struct timeval时的秒数,tv_usec为微秒数,即秒后面的零头。即当前时间距Epoch时间tv_sec秒,tv_usec微秒。
    */

    struct timeval time; 
    //int gettimeofday(struct  timeval*tv,struct  timezone *tz )
    //gettimeofday()会把目前的时间用tv 结构体返回,当地时区的信息则放到tz所指的结构中
    //在gettimeofday()函数中tv或者tz都可以为空。如果为空则就不返回其对应的结构体。
    //获取时间
    if (gettimeofday(&time, NULL)) {
        return 0;
    }
    // tv_usec 获取到微秒,需要10^-6转换为秒
    return (double)time.tv_sec + (double)time.tv_usec * .000001;
}

// 读取指定文件中,每一行的最开始的整数,保存到一维数组中,数组长度为文件的有效行数。
int *read_map(char *filename)
{
    int n = 0;
    int *map = 0;
    char *str;
    FILE *file = fopen(filename, "r");//打开文件
    if(!file) file_error(filename);//判断是否成功打开
    //fgetl:从文件中读取一行数据,并去掉行末的换行符
    while((str=fgetl(file))){//逐行获得数据
        ++n;
        map = (int*)xrealloc(map, n * sizeof(int));//realloc扩大数据空间,size为数据的长度
        map[n-1] = atoi(str);//将字符串转换为整型数据【跳过空格,tab】,存放到map末尾中
        free(str);
    }
    if (file) fclose(file);
    return map;
}

// 对每一个sections进行洗牌操作
//在64位系统中为long long unsigned int,非64位系统中为long unsigned int
//在某些情况下,使用size_t类型是更为有效,比习惯性使用无符号类型的程序会更安全。
void sorta_shuffle(void *arr, size_t n, size_t size, size_t sections)
{
    size_t i;
    for(i = 0; i < sections; ++i){
        size_t start = n*i/sections;
        size_t end = n*(i+1)/sections;
        size_t num = end-start;
        shuffle((char*)arr+(start*size), num, size);// shuffle对数组进行洗牌操作
    }
}

// 对数组进行洗牌操作
void shuffle(void *arr, size_t n, size_t size)
{
    size_t i;
    void* swp = (void*)xcalloc(1, size); //分配一个1个长度为size的连续空间
    for(i = 0; i < n-1; ++i){
        size_t j = i + random_gen()/(RAND_MAX / (n-i)+1);//进行洗牌操作【?】
        memcpy(swp,            (char*)arr+(j*size), size);
        memcpy((char*)arr+(j*size), (char*)arr+(i*size), size);
        memcpy((char*)arr+(i*size), swp,          size);
    }
    free(swp);
}

// 就是删除,从第index+1开始,到argc结束,将argv元素向左移动,最后一个元素置null
void del_arg(int argc, char **argv, int index)
{
    int i;
    for(i = index; i < argc-1; ++i) argv[i] = argv[i+1];
    argv[i] = 0;
}

// 删除指定字符串 arg,其后面的字符串往左移动
int find_arg(int argc, char* argv[], char *arg)
{
    int i;
    for(i = 0; i < argc; ++i) {
        if(!argv[i]) continue;
        if(0==strcmp(argv[i], arg)) {//如果有arg相同的字符
            del_arg(argc, argv, i);//删除【这里应该只能删除第一个碰到的相同字符吧?】
            return 1;
        }
    }
    return 0;
}

//查找字符串arg, 后面的参数往左一定两个位置(删除)
int find_int_arg(int argc, char **argv, char *arg, int def)
{
    int i;
    for(i = 0; i < argc-1; ++i){//在这个范围内
        if(!argv[i]) continue;
        if(0==strcmp(argv[i], arg)){//找到了目标值
            def = atoi(argv[i+1]);目标值后一位转为int【?】
            del_arg(argc, argv, i);
            del_arg(argc, argv, i);//这里删除目标值和目标值后一位【?感觉应该是读cfg文件时要用到的,要继续往后看】
            break;
        }
    }
    return def;//返回目标值
}

//同上int 
float find_float_arg(int argc, char **argv, char *arg, float def)
{
    int i;
    for(i = 0; i < argc-1; ++i){
        if(!argv[i]) continue;
        if(0==strcmp(argv[i], arg)){
            def = atof(argv[i+1]);
            del_arg(argc, argv, i);
            del_arg(argc, argv, i);
            break;
        }
    }
    return def;
}

//同上int
char *find_char_arg(int argc, char **argv, char *arg, char *def)
{
    int i;
    for(i = 0; i < argc-1; ++i){
        if(!argv[i]) continue;
        if(0==strcmp(argv[i], arg)){
            def = argv[i+1];
            del_arg(argc, argv, i);
            del_arg(argc, argv, i);
            break;
        }
    }
    return def;
}


// 提取cfg文件的文件名,
//比如cfg/yolo-tiny.cfg-->yolo-tiny.cfg
//cfg\\yolo-tiny.cfg-->yolo-tiny.cfg
char *basecfg(char *cfgfile)
{
    char *c = cfgfile;
    char *next;
    // 查找到最后一个 '/', 只要最后一个'/'后面的内容
    while((next = strchr(c, '/')))
    {
        c = next+1;
    }
    //查找到最后一个 '\\', 只要最后一个'\\'后面的内容
    if(!next) while ((next = strchr(c, '\\'))) { c = next + 1; }
    c = copy_string(c);//将文件名给c
    next = strchr(c, '.');//yolo-tiny.cfg-->next=.cfg
    if (next) *next = 0;//next 部分置0
    return c;
}

// 字符转整型
int alphanum_to_int(char c)
{
    return (c < 58) ? c - 48 : c-87;
}

// 整型转字符
char int_to_alphanum(int i)
{
    if (i == 36) return '.';
    return (i < 10) ? i + 48 : i + 87;
}

// 可视化float数组A,M×N列
void pm(int M, int N, float *A)
{
    int i,j;
    for(i =0 ; i < M; ++i){
        printf("%d ", i+1);
        for(j = 0; j < N; ++j){
            printf("%2.4f, ", A[i*N+j]);
        }
        printf("\n");
    }
    printf("\n");
}

// 判断str中是否出现子串orig,若出现则进行替代;
void find_replace(const char* str, char* orig, char* rep, char* output)
{
    char* buffer = (char*)calloc(8192, sizeof(char));
    char *p;

    sprintf(buffer, "%s", str);
    // 判断orig是否是buffer的子串,若是返回orig在buffer的起始地址,否则返回null
    if (!(p = strstr(buffer, orig))) {  // Is 'orig' even in 'str'?
        sprintf(output, "%s", buffer);
        free(buffer);
        return;
    }

    *p = '\0';// sprintf拼接必须是'\0'结尾的字符数组;
    //将origin用rep代替
    sprintf(output, "%s%s%s", buffer, rep, p + strlen(orig));
    free(buffer);
}

//将读取的字符串进行精简,删掉最开始和最末尾可能存在的' '和'\t'
//比如' \t   yolo-tiny   \t'-->'yolo-tiny'
void trim(char *str)
{
    char* buffer = (char*)xcalloc(8192, sizeof(char));
    sprintf(buffer, "%s", str);

    char *p = buffer;
    while (*p == ' ' || *p == '\t') ++p;//判断str中开头部分是否有' '和'\t'如果有就跳过

    char *end = p + strlen(p) - 1;//排除开头的空格部分后,找到p的最末尾
    while (*end == ' ' || *end == '\t') { //判断str中,从末尾开始是否有' '和'\t'如果有就截掉
        *end = '\0';
        --end;//重新设定末尾位置
    }
    sprintf(str, "%s", p);

    free(buffer);
}


void find_replace_extension(char *str, char *orig, char *rep, char *output)
{
    char* buffer = (char*)calloc(8192, sizeof(char));//缓冲空间,中转站

    sprintf(buffer, "%s", str);
    char *p = strstr(buffer, orig);// 判断orig是否是buffer的子串,若是返回orig在buffer的起始地址,否则返回null给p
    int offset = (p - buffer);//获得子串的位移长度,子串起始地址到buffer的起始地址
    int chars_from_end = strlen(buffer) - offset;//获得从子串起始地址到末尾的长度
    //如果p==null或者获得从子串起始地址到末尾的长度不等于子串的长度,则返回orig在buffer的起始地址,否则返回null
    if (!p || chars_from_end != strlen(orig)) {  // Is 'orig' even in 'str' AND is 'orig' found at the end of 'str'?
        sprintf(output, "%s", buffer);
        free(buffer);
        return;
    }

    *p = '\0';

    //将origin用rep代替
    sprintf(output, "%s%s%s", buffer, rep, p + strlen(orig));
    free(buffer);
}

void replace_image_to_label(const char* input_path, char* output_path)
{
    find_replace(input_path, "/images/train2014/", "/labels/train2014/", output_path);    // COCO
    find_replace(output_path, "/images/val2014/", "/labels/val2014/", output_path);        // COCO
    find_replace(output_path, "/JPEGImages/", "/labels/", output_path);    // PascalVOC
    find_replace(output_path, "\\images\\train2014\\", "\\labels\\train2014\\", output_path);    // COCO
    find_replace(output_path, "\\images\\val2014\\", "\\labels\\val2014\\", output_path);        // COCO
    find_replace(output_path, "\\JPEGImages\\", "\\labels\\", output_path);    // PascalVOC
    //find_replace(output_path, "/images/", "/labels/", output_path);    // COCO
    //find_replace(output_path, "/VOC2007/JPEGImages/", "/VOC2007/labels/", output_path);        // PascalVOC
    //find_replace(output_path, "/VOC2012/JPEGImages/", "/VOC2012/labels/", output_path);        // PascalVOC

    //find_replace(output_path, "/raw/", "/labels/", output_path);
    trim(output_path);

    // replace only ext of files
    find_replace_extension(output_path, ".jpg", ".txt", output_path);
    find_replace_extension(output_path, ".JPG", ".txt", output_path); // error
    find_replace_extension(output_path, ".jpeg", ".txt", output_path);
    find_replace_extension(output_path, ".JPEG", ".txt", output_path);
    find_replace_extension(output_path, ".png", ".txt", output_path);
    find_replace_extension(output_path, ".PNG", ".txt", output_path);
    find_replace_extension(output_path, ".bmp", ".txt", output_path);
    find_replace_extension(output_path, ".BMP", ".txt", output_path);
    find_replace_extension(output_path, ".ppm", ".txt", output_path);
    find_replace_extension(output_path, ".PPM", ".txt", output_path);
    find_replace_extension(output_path, ".tiff", ".txt", output_path);
    find_replace_extension(output_path, ".TIFF", ".txt", output_path);

    // Check file ends with txt:
    if(strlen(output_path) > 4) {
        char *output_path_ext = output_path + strlen(output_path) - 4;
        if( strcmp(".txt", output_path_ext) != 0){
            fprintf(stderr, "Failed to infer label file name (check image extension is supported): %s \n", output_path);
        }
    }else{
        fprintf(stderr, "Label file name is too short: %s \n", output_path);
    }
}

float sec(clock_t clocks)
{
    return (float)clocks/CLOCKS_PER_SEC;
}

void top_k(float *a, int n, int k, int *index)
{
    int i,j;
    for(j = 0; j < k; ++j) index[j] = -1;
    for(i = 0; i < n; ++i){
        int curr = i;
        for(j = 0; j < k; ++j){
            if((index[j] < 0) || a[curr] > a[index[j]]){
                int swap = curr;
                curr = index[j];
                index[j] = swap;
            }
        }
    }
}

void error(const char *s)
{
    perror(s);
    assert(0);
    exit(EXIT_FAILURE);
}

void malloc_error()
{
    fprintf(stderr, "xMalloc error\n");
    exit(EXIT_FAILURE);
}

void calloc_error()
{
    fprintf(stderr, "Calloc error\n");
    exit(EXIT_FAILURE);
}

void realloc_error()
{
    fprintf(stderr, "Realloc error\n");
    exit(EXIT_FAILURE);
}

void file_error(char *s)
{
    fprintf(stderr, "Couldn't open file: %s\n", s);
    exit(EXIT_FAILURE);
}

list *split_str(char *s, char delim)
{
    size_t i;
    size_t len = strlen(s);
    list *l = make_list();
    list_insert(l, s);
    for(i = 0; i < len; ++i){
        if(s[i] == delim){
            s[i] = '\0';
            list_insert(l, &(s[i+1]));
        }
    }
    return l;
}

void strip(char *s)
{
    size_t i;
    size_t len = strlen(s);
    size_t offset = 0;
    for(i = 0; i < len; ++i){
        char c = s[i];
        if(c==' '||c=='\t'||c=='\n'||c =='\r'||c==0x0d||c==0x0a) ++offset;
        else s[i-offset] = c;
    }
    s[len-offset] = '\0';
}


void strip_args(char *s)
{
    size_t i;
    size_t len = strlen(s);
    size_t offset = 0;
    for (i = 0; i < len; ++i) {
        char c = s[i];
        if (c == '\t' || c == '\n' || c == '\r' || c == 0x0d || c == 0x0a) ++offset;
        else s[i - offset] = c;
    }
    s[len - offset] = '\0';
}

void strip_char(char *s, char bad)
{
    size_t i;
    size_t len = strlen(s);
    size_t offset = 0;
    for(i = 0; i < len; ++i){
        char c = s[i];
        if(c==bad) ++offset;
        else s[i-offset] = c;
    }
    s[len-offset] = '\0';
}

void free_ptrs(void **ptrs, int n)
{
    int i;
    for(i = 0; i < n; ++i) free(ptrs[i]);
    free(ptrs);
}

// 读取指定文件中的一行字符
char *fgetl(FILE *fp)
{
    // feof()检测流文件指针是否已到文件结尾。文件读取结束,返回非0,否则返回0.
    if(feof(fp)) return 0;
    size_t size = 512;// 申请512个字符空间
    char* line = (char*)xmalloc(size * sizeof(char));

    //fgets 读取文件中一行的数据,存放到line中.读取失败或读取到换行符或读取到文件末尾返回,读取fgets失败返回null
    if(!fgets(line, size, fp)){
        free(line);
        return 0;
    }

    size_t curr = strlen(line);//获得当前读取数据的curr_size
    
    //读取未满一行时,最后一个字符不为'\n'且文件流文件指针没有到结尾
    while((line[curr-1] != '\n') && !feof(fp)){
        //如果curr_size的大小等于之前构建的字符空间,那么进行扩容
        if(curr == size-1){
            size *= 2;
            line = (char*)xrealloc(line, size * sizeof(char));
        }
        size_t readsize = size-curr;//可读size获得
        if(readsize > INT_MAX) readsize = INT_MAX-1; //判断界限,不能超过INTMAX,上溢
        fgets(&line[curr], readsize, fp);//继续读取剩余部分的数据
        curr = strlen(line);//获得新的数据size
    }
    // 手动字符串补0
    //index n-1处为'\n'表示读完了一行,将其修改为'\0',因为字符数组默认结果为'\0',需手动补上
    if(curr >= 2)
        if(line[curr-2] == 0x0d) line[curr-2] = 0x00;
    if(curr >= 1)
        if(line[curr-1] == 0x0a) line[curr-1] = 0x00;

    return line;
}

//读整型数据
int read_int(int fd)
{
    int n = 0;
    // next为成功读取的字节数,如果为-1,则表示读取失败,若调read之前已经到达文件末尾,则这次read返回0.
    int next = read(fd, &n, sizeof(int));
    if(next <= 0) return -1;
    return n;
}

// 向文件fd中写入一个整数
void write_int(int fd, int n)
{
    int next = write(fd, &n, sizeof(int));
    if(next <= 0) error("read failed");
}

// 从fd文件中,读取bytes个字节数据到内存中buffer起始,直到读完
int read_all_fail(int fd, char *buffer, size_t bytes)
{
    size_t n = 0;
    while(n < bytes){
        int next = read(fd, buffer + n, bytes-n);
        if(next <= 0) return 1;
        n += next;
    }
    return 0;
}

// 将内存中buffer起始的bytes个字节数据写入到fd文件中,直到写完
int write_all_fail(int fd, char *buffer, size_t bytes)
{
    size_t n = 0;
    while(n < bytes){
        // 将buffer+n 所指向的内存写入bytes-n个字节到fd文件中
        size_t next = write(fd, buffer + n, bytes-n);
        //如果写入成功,会返回写入的字节数,即返回 bytes,否则,返回-1【写入失败】
        if(next <= 0) return 1;
        n += next;//更新读取的字节数直到满足 bytes的要求
    }
    return 0;
}

// 将内存中buffer起始的bytes个字节数据写入到fd文件中,一次性操作,若写不完,则报错
void read_all(int fd, char *buffer, size_t bytes)
{
    size_t n = 0;
    while(n < bytes){
        int next = read(fd, buffer + n, bytes-n);
        if(next <= 0) error("read failed");
        n += next;
    }
}

// 从fd文件中,读取bytes个字节数据到内存中buffer起始,一次性操作,若读不完,则报错
void write_all(int fd, char *buffer, size_t bytes)
{
    size_t n = 0;
    while(n < bytes){
        size_t next = write(fd, buffer + n, bytes-n);
        if(next <= 0) error("write failed");
        n += next;
    }
}

// 字符数组的复制操作
char *copy_string(char *s)
{
    if(!s) {
        return NULL;
    }
    char* copy = (char*)xmalloc(strlen(s) + 1);//空间
    //将以s地址开始的前strlen(s) + 1 个字节复制到copy所指向的数组中
    strncpy(copy, s, strlen(s)+1);
    return copy;
}

// 解析某种特定格式,如: "******, "222,"32242, "342423
list *parse_csv_line(char *line)
{
    list *l = make_list();// 链表初始化
    char *c, *p;
    int in = 0;
    // 遍历字符数组line
    for(c = line, p = line; *c != '\0'; ++c){
        if(*c == '"') in = !in;//如果有",则in=1
        else if(*c == ',' && !in){//如果有,且in=0-->遇到','截断
            *c = '\0';//将该位置截止符
            //用list插入函数将得到的字符串,放入l中
            list_insert(l, copy_string(p));
            p = c+1;//更新循环信息
        }
    }
    list_insert(l, copy_string(p));//插入最后的剩余部分
    return l;
}

// 统计字符数组中有多少','字符以及'\0'
int count_fields(char *line)
{
    int count = 0;
    int done = 0;
    char *c;
    for(c = line; !done; ++c){
        done = (*c == '\0');//判断是否结尾【?】
        if(*c == ',' || done) ++count;
    }
    return count;
}

// 解析字符数组中的float实数
float *parse_fields(char *line, int n)
{
    float* field = (float*)xcalloc(n, sizeof(float));//申请空间
    char *c, *p, *end;
    int count = 0;
    int done = 0;
    for(c = line, p = line; !done; ++c){
        done = (*c == '\0');//判断是否到末尾
        if(*c == ',' || done){//如果到末尾或者遇到','字符,进入循环,如果没有碰到则将c指针加一,获取下一字符,这时候p是保持不变的;
            *c = '\0';//将字符截断
//strtod将字符串转换为float类型 ,会跳过前面的空格字符,直到遇到数字或者+/- 才开始转换,到出现非数字或者字符串结束符'\0'结束;end,
            field[count] = strtod(p, &end); //将截断的字符中可转换的字符转换为float型

// 如果转换数字开始位置指针p 和 工作指针c指向同一地址,表明,一开始就遇到','或者'\0',肯定不合理,使用nan函数
            if(p == c) field[count] = nan("");


            if(end != c && (end != c-1 || *end != '\r')) field[count] = nan(""); //DOS file formats!【?这里不太懂】
            p = c+1;//这一段转换结束后,将p起始位置放到与c一样的时候
            ++count;//并且统计截断字符的次数
        }
    }
    return field;
}

// 对float一维数组求和,比较好理解
float sum_array(float *a, int n)
{
    int i;
    float sum = 0;
    for(i = 0; i < n; ++i) sum += a[i];
    return sum;
}

//对float一维数组计算均值
float mean_array(float *a, int n)
{
    return sum_array(a,n)/n;
}

// 求二维float数组,每一列的平均值,保存在avg一维float数组中
void mean_arrays(float **a, int n, int els, float *avg)
{
    int i;
    int j;
    memset(avg, 0, els*sizeof(float));
    for(j = 0; j < n; ++j){
        for(i = 0; i < els; ++i){
            avg[i] += a[j][i];
        }
    }
    for(i = 0; i < els; ++i){
        avg[i] /= n;
    }
}

// 计算向量a的mean和var,并输出
void print_statistics(float *a, int n)
{
    float m = mean_array(a, n);
    float v = variance_array(a, n);
    printf("MSE: %.6f, Mean: %.6f, Variance: %.6f\n", mse_array(a, n), m, v);
}

// 对float一维数组求方差
float variance_array(float *a, int n)
{
    int i;
    float sum = 0;
    float mean = mean_array(a, n);
    for(i = 0; i < n; ++i) sum += (a[i] - mean)*(a[i]-mean);//计算方差
    float variance = sum/n;
    return variance;
}

// 判断整数a 与 区间整数[min, max]的关系,超过区间返回区间上下限
int constrain_int(int a, int min, int max)
{
    if (a < min) return min;
    if (a > max) return max;
    return a;
}

// 判断小数a 与 区间小数[min, max]的关系,超过区间返回区间上下限
float constrain(float min, float max, float a)
{
    if (a < min) return min;
    if (a > max) return max;
    return a;
}

// 当sub为1的时候,其实就是计算两个一维数组的欧式距离
float dist_array(float *a, float *b, int n, int sub)
{
    int i;
    float sum = 0;
    for(i = 0; i < n; i += sub) sum += pow(a[i]-b[i], 2);
    return sqrt(sum);
}
// 向量的模长除以N
float mse_array(float *a, int n)
{
    int i;
    float sum = 0;
    for(i = 0; i < n; ++i) sum += a[i]*a[i];
    return sqrt(sum/n);
}

// 归一化操作
void normalize_array(float *a, int n)
{
    int i;
    float mu = mean_array(a,n);//均值
    float sigma = sqrt(variance_array(a,n));//方差
    for(i = 0; i < n; ++i){
        a[i] = (a[i] - mu)/sigma;//归一化
    }
    mu = mean_array(a,n);//重新得到均值
    sigma = sqrt(variance_array(a,n));//重新得到方差
}

//向量平移
void translate_array(float *a, int n, float s)
{
    int i;
    for(i = 0; i < n; ++i){
        a[i] += s;
    }
}

//向量取模
float mag_array(float *a, int n)
{
    int i;
    float sum = 0;
    for(i = 0; i < n; ++i){
        sum += a[i]*a[i];
    }
    return sqrt(sum);
}

//这里就是取需要的数据向量的模
// indicies to skip is a bit array
float mag_array_skip(float *a, int n, int * indices_to_skip)
{
    int i;
    float sum = 0;
    for (i = 0; i < n; ++i) {
        if (indices_to_skip[i] != 1) {
            sum += a[i] * a[i];
        }
    }
    return sqrt(sum);
}
 

// 向量的与实数的乘法
void scale_array(float *a, int n, float s)
{
    int i;
    for(i = 0; i < n; ++i){
        a[i] *= s;
    }
}

 
// 从向量中采用一个数,返回其index
int sample_array(float *a, int n)
{
    float sum = sum_array(a, n);
    scale_array(a, n, 1. / sum);
    float r = rand_uniform(0, 1);//随机生成0-1的数
    int i;
    for (i = 0; i < n; ++i) {
        r = r - a[i];//满足条件计算
        if (r <= 0) return i;//若满足则返回值的位置
    }
    return n - 1;
}

//与上面函数是一个功能,只是需要满足的条件不同,
int sample_array_custom(float *a, int n)
{
    float sum = sum_array(a, n);
    scale_array(a, n, 1./sum);
    float r = rand_uniform(0, 1);
    int start_index = rand_int(0, 0);
    int i;
    for(i = 0; i < n; ++i){
        r = r - a[(i + start_index) % n];
        if (r <= 0) return i;
    }
    return n-1;
}
// 一维int数组找最大值操作,若找到最大值,返回index,否则,返回-1;
int max_index(float *a, int n)
{
    if(n <= 0) return -1;
    int i, max_i = 0;
    float max = a[0];
    for(i = 1; i < n; ++i){
        if(a[i] > max){
            max = a[i];
            max_i = i;
        }
    }
    return max_i;
}


int top_max_index(float *a, int n, int k)
{
    if (n <= 0) return -1;
    float *values = (float*)xcalloc(k, sizeof(float));
    int *indexes = (int*)xcalloc(k, sizeof(int));//构建临时空间
    int i, j;
    for (i = 0; i < n; ++i) {
        for (j = 0; j < k; ++j) {
            if (a[i] > values[j]) {//局部最大值【?】
                values[j] = a[i];
                indexes[j] = i;
                break;
            }
        }
    }
    int count = 0;
    for (j = 0; j < k; ++j) if (values[j] > 0) count++;//判断局部最大值的个数
    int get_index = rand_int(0, count-1);// 返回一个区间[0, count-1]内的一个整数
    int val = indexes[get_index];//获得该位置的值,并返回
    free(indexes);
    free(values);
    return val;
}

// 一维数组进行查找操作,若查找指定值,返回index,否则,返回-1;
int int_index(int *a, int val, int n)
{
    int i;
    for (i = 0; i < n; ++i) {
        if (a[i] == val) return i;
    }
    return -1;
}

 
// 返回一个区间[min, max]内的一个整数
int rand_int(int min, int max)
{
    if (max < min){
        int s = min;
        min = max;
        max = s;
    }
    int r = (random_gen()%(max - min + 1)) + min;
    return r;
}

// From http://en.wikipedia.org/wiki/Box%E2%80%93Muller_transform
// 标准正太分布
float rand_normal()
{
    static int haveSpare = 0;
    static double rand1, rand2;

    if(haveSpare)
    {
        haveSpare = 0;
        return sqrt(rand1) * sin(rand2);
    }

    haveSpare = 1;
    // 获取区间[0,1]内的一个随机数
    rand1 = random_gen() / ((double) RAND_MAX);
    if(rand1 < 1e-100) rand1 = 1e-100;
    rand1 = -2 * log(rand1);
    rand2 = (random_gen() / ((double)RAND_MAX)) * 2.0 * M_PI;

    return sqrt(rand1) * cos(rand2);
}

/*
   float rand_normal()
   {
   int n = 12;
   int i;
   float sum= 0;
   for(i = 0; i < n; ++i) sum += (float)random_gen()/RAND_MAX;
   return sum-n/2.;
   }
 */

size_t rand_size_t()
{
    return  ((size_t)(random_gen()&0xff) << 56) |
            ((size_t)(random_gen()&0xff) << 48) |
            ((size_t)(random_gen()&0xff) << 40) |
            ((size_t)(random_gen()&0xff) << 32) |
            ((size_t)(random_gen()&0xff) << 24) |
            ((size_t)(random_gen()&0xff) << 16) |
            ((size_t)(random_gen()&0xff) << 8) |
            ((size_t)(random_gen()&0xff) << 0);
}

// 进行随机采样操作,从区间[min, max]随机返回一个实数
float rand_uniform(float min, float max)
{
    if(max < min){
        float swap = min;
        min = max;
        max = swap;
    }

//局限范围有效
#if (RAND_MAX < 65536)
        int rnd = rand()*(RAND_MAX + 1) + rand();
        return ((float)rnd / (RAND_MAX*RAND_MAX) * (max - min)) + min;
#else
        return ((float)rand() / RAND_MAX * (max - min)) + min;
#endif
    //return (random_float() * (max - min)) + min;
}

 
// 随机采用的基础上,50%的概率返回S,50%的概率返回1/s
float rand_scale(float s)
{
    float scale = rand_uniform_strong(1, s);
    if(random_gen()%2) return scale;
    return 1./scale;
}

// 进行one_hot 编码,根据,float数组a中的元素进行编码
float **one_hot_encode(float *a, int n, int k)
{
    int i;
    float** t = (float**)xcalloc(n, sizeof(float*)); // 申请n个float * 指针存储空间
    for(i = 0; i < n; ++i){
        t[i] = (float*)xcalloc(k, sizeof(float)); // 每个t中的元素为一个float 指针,指向k个float
        int index = (int)a[i];// 丢掉小数部分
        t[i][index] = 1; //第index 置为1
    }
    return t;
}

static unsigned int x = 123456789, y = 362436069, z = 521288629;

// Marsaglia's xorshf96 generator: period 2^96-1
unsigned int random_gen_fast(void)
{
    unsigned int t;
    x ^= x << 16; //x*(2^16)  ^  x
    x ^= x >> 5;
    x ^= x << 1;

    t = x;
    x = y;
    y = z;
    z = t ^ x ^ y;

    return z;
}

float random_float_fast()
{
    return ((float)random_gen_fast() / (float)UINT_MAX);
}

int rand_int_fast(int min, int max)
{
    if (max < min) {
        int s = min;
        min = max;
        max = s;
    }
    int r = (random_gen_fast() % (max - min + 1)) + min;
    return r;
}

unsigned int random_gen()
{
    unsigned int rnd = 0;
#ifdef WIN32
    rand_s(&rnd);
#else   // WIN32
    rnd = rand();
#if (RAND_MAX < 65536)
        rnd = rand()*(RAND_MAX + 1) + rnd;
#endif  //(RAND_MAX < 65536)
#endif  // WIN32
    return rnd;
}


float random_float()
{
    unsigned int rnd = 0;
#ifdef WIN32
    rand_s(&rnd);
    return ((float)rnd / (float)UINT_MAX);
#else   // WIN32

    rnd = rand();
#if (RAND_MAX < 65536)
    rnd = rand()*(RAND_MAX + 1) + rnd;
    return((float)rnd / (float)(RAND_MAX*RAND_MAX));
#endif  //(RAND_MAX < 65536)
    return ((float)rnd / (float)RAND_MAX);

#endif  // WIN32
}

float rand_uniform_strong(float min, float max)
{
    if (max < min) {
        float swap = min;
        min = max;
        max = swap;
    }
    return (random_float() * (max - min)) + min;
}

float rand_precalc_random(float min, float max, float random_part)
{
    if (max < min) {
        float swap = min;
        min = max;
        max = swap;
    }
    return (random_part * (max - min)) + min;
}

#define RS_SCALE (1.0 / (1.0 + RAND_MAX))

double double_rand(void)
{
    double d;
    do {
        d = (((rand() * RS_SCALE) + rand()) * RS_SCALE + rand()) * RS_SCALE;
    } while (d >= 1); // Round off
    return d;
}

unsigned int uint_rand(unsigned int less_than)
{
    return (unsigned int)((less_than)* double_rand());
}

//确认数组中是否有值为nan
int check_array_is_nan(float *arr, int size)
{
    int i;
    for (i = 0; i < size; ++i) {
        if (isnan(arr[i])) return 1;
    }
    return 0;
}

//确认数组中是否有浮点数是无限大
int check_array_is_inf(float *arr, int size)
{
    int i;
    for (i = 0; i < size; ++i) {
        if (isinf(arr[i])) return 1;
    }
    return 0;
}

//随机生成无序的整数数组
int *random_index_order(int min, int max)
{
    int *inds = (int *)xcalloc(max - min, sizeof(int));//临时空间
    int i;
    for (i = min; i < max; ++i) {
        inds[i - min] = i;//给数组inds赋值
    }
    for (i = min; i < max - 1; ++i) {
        int swap = inds[i - min];
        int index = i + rand() % (max - i);
        inds[i - min] = inds[index - min];
        inds[index - min] = swap;//交换任意序号的两个值
    }
    return inds;
}

// 一维int数组找最大值操作,若找到最大值,返回index,否则,返回-1;
int max_int_index(int *a, int n)
{
    if (n <= 0) return -1;
    int i, max_i = 0;
    int max = a[0];
    for (i = 1; i < n; ++i) {
        if (a[i] > max) {
            max = a[i];
            max_i = i;
        }
    }
    return max_i;
}


// Absolute box from relative coordinate bounding box and image size

//boxabs的定义我还没找到耶
boxabs box_to_boxabs(const box* b, const int img_w, const int img_h, const int bounds_check)
{
    boxabs ba;
    ba.left = (b->x - b->w / 2.)*img_w;
    ba.right = (b->x + b->w / 2.)*img_w;
    ba.top = (b->y - b->h / 2.)*img_h;
    ba.bot = (b->y + b->h / 2.)*img_h;//获得图片上的box的相对应位置

    if (bounds_check) {//边界限定
        if (ba.left < 0) ba.left = 0;
        if (ba.right > img_w - 1) ba.right = img_w - 1;
        if (ba.top < 0) ba.top = 0;
        if (ba.bot > img_h - 1) ba.bot = img_h - 1;
    }

    return ba;//返回转换的box
}

//创建文件夹
int make_directory(char *path, int mode)
{
#ifdef WIN32
    return _mkdir(path);
#else
    return mkdir(path, mode);
#endif
}

 

  • 1
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值