25) HW3 Review

25) HW3 Review#

Today#

1. Review of HW3
2. Submission expectations and reminders

1. Review of HW3#

Solution to HW3. Here is my C code:

#include <argp.h>
#include <errno.h>
#include <limits.h>
#include <math.h>
#include <omp.h>
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

// Command-line settings filled in by parse_opt.
struct Args {
  size_t length;         // vector length (-S); parse_opt defaults it to 24
  size_t nreps;          // number of repetitions (-r); parse_opt defaults it to 10
  bool block;            // true when -b is given: run the blocked dot product test
  size_t unroll_factor;  // not set or read anywhere in this file
};

// static memory variable declared here
// Command-line options handled by parse_opt. Each entry is
// {long name, short key, argument name, flags, help text}.
// argp walks this array until it reaches an entry whose fields are all
// zero, so the trailing {0} terminator is required; without it argp reads
// past the end of the array.
static const struct argp_option options[] = {
  {"length", 'S', "size_t", 0, "Length of each vector"},
  {"nreps", 'r', "size_t", 0, "Number of repetitions"},
  {"block", 'b', NULL, 0, "Compute block dot products (versus a single dot product)"},
  {0}
};

// Converts the decimal string `text` into a size_t stored in *out.
// Returns 0 on success. Returns -1 (leaving *out untouched) when the text
// does not start with a digit, has trailing characters, or does not fit in
// a size_t.
static int parse_size(const char *text, size_t *out)
{
  // Insist on a leading digit: strtoull would otherwise accept a '-' sign
  // and silently wrap the negated value around to a huge number.
  if (text == NULL || text[0] < '0' || text[0] > '9')
    return -1;

  char *end = NULL;
  errno = 0;
  unsigned long long value = strtoull(text, &end, 10);
  if (end == text || *end != '\0' || errno == ERANGE)
    return -1;
  if ((unsigned long long)(size_t)value != value)
    return -1; // representable as unsigned long long but not as size_t

  *out = (size_t)value;
  return 0;
}

// argp callback: stores the defaults on ARGP_KEY_INIT and then records each
// recognised option in the struct Args passed to argp_parse as input.
// Returns 0 when the key was handled, ARGP_ERR_UNKNOWN for keys this parser
// does not recognise, and EINVAL when a numeric argument is malformed.
static error_t parse_opt (int key, char *arg, struct argp_state *state)
{
  struct Args *args = state->input;
  switch (key) {
  case ARGP_KEY_INIT:
    args->length = 24;
    args->nreps = 10;
    args->block = false;
    break;
  case 'S':
    if (parse_size(arg, &args->length) != 0) {
      // argp_error reports the problem and normally exits; the return
      // covers the case where the parser was asked not to exit.
      argp_error(state, "invalid vector length '%s'", arg);
      return EINVAL;
    }
    break;
  case 'r':
    if (parse_size(arg, &args->nreps) != 0) {
      argp_error(state, "invalid number of repetitions '%s'", arg);
      return EINVAL;
    }
    break;
  case 'b':
    args->block = true;
    break;
  default:
    return ARGP_ERR_UNKNOWN;
  }
  return 0;
}

// Sizes used by the blocked test in main: the left operand has I rows and
// the right operand has J columns.
int I = 8;
int J = 4;
// Tolerance passed to is_orthogonal in main.
double tol = 1e-6;

// Lengths of the hard-coded test vectors in main:
// c_length[0] goes with a1/b1 and c_length[1] with a2/b2.
int c_length[] = {3, 4};


// Function declarations here
// Sum of a[i]*b[i] over the first S entries.
double dot_product(int S, const double *a, const double *b);
// Square root of the sum of squares of the first S entries of a.
// Note the argument order: the vector comes first, then its length.
double vector_norm(const double *a, int S);
// Orthogonality test for a and b of length S, using tolerance tol.
int is_orthogonal(int S, const double *a, const double *b, double tol);
// Fills the I-by-J output p with dot products of length-S slices of m and n.
void bdot(int I, int S, int J, const double *m, const double *n, double *p);

// Returns a[0]*b[0] + ... + a[S-1]*b[S-1], accumulated left to right.
// Returns 0 when S is not positive.
double dot_product(int S, const double *a, const double *b){
    double acc = 0;
    const double *pa = a;
    const double *pb = b;

    // Walk both vectors in lockstep, one product per step.
    for (int remaining = S; remaining > 0; remaining--) {
        acc += (*pa) * (*pb);
        pa++;
        pb++;
    }

    return acc;
}

double vector_norm(const double *a, int S){

    double sum = 0;
    for (int i = 0; i<S; i++)
        sum += pow(a[i],2);

    return sqrt(sum);
}

// Returns 1 when the magnitude of the dot product of a and b (both of
// length S) is at most tol, and 0 otherwise.
int is_orthogonal(int S, const double *a, const double *b, double tol){

    // The absolute value must be taken of the dot product itself, not of the
    // comparison result; otherwise every negative dot product passes the test.
    return fabs(dot_product(S, a, b)) <= tol;
}

// Blocked dot product: computes P = M * N, with M of shape (I,S) and N of
// shape (S,J). M is stored row by row and N column by column, so every
// entry of P is the dot product of two contiguous length-S slices.
// P is written row by row into p (I*J entries).
void bdot(int I, int S, int J, const double *m, const double *n, double *p){

    for (int row = 0; row < I; row++) {
        for (int col = 0; col < J; col++) {
            const double *m_row = m + row*S;
            const double *n_col = n + col*S;
            p[row*J + col] = dot_product(S, m_row, n_col);
        }
    }
}

// Fills the test operands with deterministic values:
//   m[i*S + s] = 1000*(i+1) + (s+1)        for i < I, s < S
//   n[j*S + s] = 1 / (1000*(j+1) + (s+1))  for j < J, s < S
static void init_bdot(int I, int S, int J, double *m, double *n) {
    for (int row = 0; row < I; row++) {
        for (int k = 0; k < S; k++)
            m[row*S + k] = 1000*(row+1) + k+1;
    }

    for (int col = 0; col < J; col++) {
        for (int k = 0; k < S; k++)
            n[col*S + k] = 1./(1000*(col+1) + k+1);
    }
}


// Reference matrix-matrix product used to validate bdot.
// Uses the same layout as bdot: entry (i,j) of p is the sum over s of
// m[i*S + s] * n[j*S + s], starting from zero.
void matrix_ref(int I, int S, int J, const double *m, const double *n, double *p){
    for (int row = 0; row < I; row++) {
        for (int col = 0; col < J; col++) {
            double acc = 0.0;
            int k = 0;
            while (k < S) {
                acc += m[row*S + k] * n[col*S + k];
                k++;
            }
            p[row*J + col] = acc;
        }
    }
}

// Prints whether a dot product agrees with its reference value.
// A difference larger than 1e-10 is reported as a validation failure;
// anything else is reported as a match under the given name.
static void report_dot(const char *name, const double result, const double ref_result) {
  const double error = fabs(result - ref_result);
  const int mismatch = error > 1e-10;

  if (mismatch) {
    printf("Result = %f failed to validate with expected value %f\n", result, ref_result);
  } else {
    printf("%s matches the reference result.\n", name);
  }
}

// Prints whether an is_orthogonal result equals its reference flag and,
// when it does, states which outcome the reference describes.
static void report_is_orthogonal(const char *name, const int result, const int ref_result) {
  if (result == ref_result) {
    const char *verdict = "not orthogonal.";
    if (ref_result) {
      verdict = "orthogonal.";
    }
    printf("%s matches the reference result. The two vectors are %s \n", name, verdict);
  } else {
    printf("Result = %d failed to validate with expected value %d \n", result, ref_result);
  }
}

// Prints whether a vector norm agrees with its reference value.
// A difference larger than 1e-10 is reported as a validation failure;
// anything else is reported as a match under the given name.
static void report_vector_norm(const char *name, const double result, const double ref_result) {
  const double error = fabs(result - ref_result);
  const int mismatch = error > 1e-10;

  if (mismatch) {
    printf("Result = %f failed to validate with expected value %f\n", result, ref_result);
  } else {
    printf("%s matches the reference result.\n", name);
  }
}

// Compares two I-by-J results entry by entry and prints the outcome.
// The first entry that differs by more than 1e-10 is reported as a failure
// and ends the check. The comparison is skipped, and a match is reported,
// when either pointer is null or both point to the same buffer.
static void report_bdot(const char *name, int I, int J, const double *result, const double *ref_result) {
  const int comparable = result && ref_result && result != ref_result;

  for (int row = 0; comparable && row < I; row++) {
    for (int col = 0; col < J; col++) {
      const int at = row*J + col;
      if (fabs(result[at] - ref_result[at]) > 1e-10) {
        printf("Result[%d,%d] = %f failed to validate with expected value %f\n", row, col, result[at], ref_result[at]);
        return;
      }
    }
  }

  printf("%s matches the reference result.\n", name);
}


// Runs the blocked-product implementation f on (I, S, J, m, n), writing into
// p, then validates p against p_ref with report_bdot. The stringified name
// of f (#f) is used as the label in the report. The do { } while (0)
// wrapper lets the macro be used as a single statement.
#define REPORT_BDOT(f, I, S, J, m, n, p, p_ref) do { \
        f(I, S, J, m, n, p);                         \
        report_bdot(#f, I, J, p, p_ref);             \
} while (0)

// Program entry point.
// Without -b: runs dot_product, is_orthogonal and vector_norm on small
// hard-coded vectors and reports each result against its reference value.
// With -b: allocates the operands for the blocked dot product, fills them
// with init_bdot, and validates bdot against matrix_ref.
// Returns 0 on success and EXIT_FAILURE when argument parsing fails, the
// requested length is unusable, or a heap allocation fails.
int main(int argc, char **argv){

    struct Args args;
    struct argp argp = {options, parse_opt, NULL, NULL};
    if (argp_parse(&argp, argc, argv, 0, 0, &args) != 0)
        return EXIT_FAILURE;

    if (!args.block) { // single dot product case
        // stack memory variable declarations here
        double a1[] = {1, 0, 0};
        double b1[] = {0, 1, 0};
        double a2[] = {1, 2, 3, 4};
        double b2[] = {1, 1, 1, 1};

        // result of (a1,b1) and (a2,b2) dot products and reference values
        double c1, c2;
        double c1_ref = 0;
        double c2_ref = 10;

        // result of is_orthogonal
        int flag1, flag2;
        int flag1_ref = 1; // a1 and b1 are orthogonal
        int flag2_ref = 0; // a2 and b2 are not orthogonal

        // result for vector_norm
        double na1, na2, nb1, nb2;
        double na1_ref = 1.0;
        double na2_ref = 5.477225575051661;
        double nb1_ref = 1.0;
        double nb2_ref = 2.0;

        // calls to your functions by reference here
        // print statements to show results
        c1 = dot_product(c_length[0], a1, b1);
        report_dot("dot_product of a1 and b1", c1, c1_ref);
        c2 = dot_product(c_length[1], a2, b2);
        report_dot("dot_product of a2 and b2", c2, c2_ref);

        flag1 = is_orthogonal(c_length[0], a1, b1, tol);
        report_is_orthogonal("is_orthogonal between a1 and b1", flag1, flag1_ref);
        flag2 = is_orthogonal(c_length[1], a2, b2, tol);
        report_is_orthogonal("is_orthogonal between a2 and b2", flag2, flag2_ref);

        na1 = vector_norm(a1, c_length[0]);
        nb1 = vector_norm(b1, c_length[0]);
        na2 = vector_norm(a2, c_length[1]);
        nb2 = vector_norm(b2, c_length[1]);
        report_vector_norm("vector_norm of a1", na1, na1_ref);
        report_vector_norm("vector_norm of a2", na2, na2_ref);
        report_vector_norm("vector_norm of b1", nb1, nb1_ref);
        report_vector_norm("vector_norm of b2", nb2, nb2_ref);

        return 0;
    }

    // blocked dot product case

    // The kernels take the length as an int and index with int arithmetic
    // (up to I*S and J*S), so reject lengths that would overflow there.
    const size_t S = args.length;
    const size_t widest = (size_t)(I > J ? I : J);
    if (S == 0 || S > (size_t)INT_MAX / widest) {
        fprintf(stderr, "Vector length %zu is out of range for the blocked dot product\n", S);
        return EXIT_FAILURE;
    }
    const int length = (int)S;

    // Initialize the matrices (as flattened vectors)
    // heap memory allocations here
    double *m = malloc((size_t)I * S * sizeof *m);
    double *n = malloc((size_t)J * S * sizeof *n);
    double *p = malloc((size_t)I * (size_t)J * sizeof *p);
    double *p_ref = malloc((size_t)I * (size_t)J * sizeof *p_ref);

    int status = 0;
    if (!m || !n || !p || !p_ref) {
        fprintf(stderr, "Failed to allocate memory for the blocked dot product\n");
        status = EXIT_FAILURE;
    } else {
        init_bdot(I, length, J, m, n);
        matrix_ref(I, length, J, m, n, p_ref);
        REPORT_BDOT(bdot, I, length, J, m, n, p, p_ref);
    }

    // free allocated heap memory here (free(NULL) is a no-op)
    free(m); free(n); free(p); free(p_ref);

    return status;
}

This program can be compiled with the GNU C compiler with:

gcc dot.c -lm -o dot

and executed with

./dot

or

./dot -b

to test the blocked version.

Common mistakes#

Here is a list of common mistakes that a few people made:

Part 4: Not really implementing a blocked dot product between the rows of \(M\) and the columns of \(N\). The best approach would have been to reuse the dot_product function implemented for Part 1. Code reuse is good practice.
E.C.: not initializing the output variable to zero before accumulating into it in the triple-nested-loop matrix-matrix multiplication. You could have achieved this either by calling calloc instead of malloc or by manually setting every entry of the output variable to zero (typically right before the innermost loop).

2. Submission expectations and reminders#

In general, when you receive an Assignment via a GitHub Classroom link, you want to clone your assignment repository, by doing

git clone your_assignment_repository_url

You can also work on a back-up repository or directory of your choice if you want to, for your scrap work, but you have to clone the assignment repository and submit your work there to be considered for submission and grading.
As soon as you clone your Assignment repository, move to that repository

cd your_assignment_repository

Create a new feature branch and switch to that. You can do this in two ways:
- git checkout -b name_of_your_branch
- git branch name_of_your_branch and then git checkout name_of_your_branch
Do NOT work directly off main
You can work on your feature branch as much as you like and create repeated incremental snapshots of your work via git commit. Always remember to use meaningful commit messages to remind yourself (and others) about your work in that moment in time. In a terminal you can simply do this by

git commit -m "Your commit message"

You can also write more detailed, multi-line commit messages if you want. Simply repeat the -m option for each additional paragraph, separating the options with a space, as in:

git commit -m "Your commit message" -m "Your more detailed message on a new line"

When you are satisfied with your committed work, you can push it to your working branch via:

git push origin your_branch_name

If it is the first time you are doing this, git will automatically tell you that you can open a Pull Request with your changes. Just CTRL-click on the URL that git shows you in the terminal and you will be sent to your Pull Request web interface.

Any subsequent changes that you push to your branch will automatically be reflected in the open PR.

Only changes made within the deadline (including the lateness window) will be graded.
Remember not to attempt to close or merge your PR without any Reviewer (in this case your instructor) approval.
Always remember to double-check the "Files changed" tab in your PR. If you see files that do not belong there (e.g., files automatically created by your IDE, or virtual environment files), remove them.
If you are using an IDE that automatically creates hidden project files that you might inadvertently push to your branch, it is always good practice to use a .gitignore file that specifies which files you do not want to be tracked by git and, therefore, pushed to your branch. Recall that we covered this in our first lecture.

Reminder about the AI policy in this course#

A friendly reminder that in this course, we follow the University Senate’s extended definition of plagiarism that includes the un-cited use of generative AI applications, specifically: “representing work produced by generative Artificial Intelligence as one’s own.”

I provided in the Syllabus examples of how to properly cite the use of any genAI or LLM tool.